[igt-dev] [PATCH i-g-t v2 2/6] lib: Add i915_perf library

Lionel Landwerlin lionel.g.landwerlin at intel.com
Tue Feb 18 22:56:16 UTC 2020


This library contains the database of performance metrics for each
supported generation as well as its associated programming.

It also allows the user to get human-readable data out of HW
generated data.

Signed-off-by: Lionel Landwerlin <lionel.g.landwerlin at intel.com>
Acked-by: Chris Wilson <chris at chris-wilson.co.uk>
---
 lib/i915-perf.pc.in                        |    10 +
 lib/i915/perf-configs/README.md            |   115 +
 lib/i915/perf-configs/codegen.py           |    33 +
 lib/i915/perf-configs/guids.xml            |   319 +
 lib/i915/perf-configs/mdapi-xml-convert.py |  1006 ++
 lib/i915/perf-configs/oa-bdw.xml           | 15653 +++++++++++++++++++
 lib/i915/perf-configs/oa-bxt.xml           |  9595 ++++++++++++
 lib/i915/perf-configs/oa-cflgt2.xml        | 10866 +++++++++++++
 lib/i915/perf-configs/oa-cflgt3.xml        | 10933 +++++++++++++
 lib/i915/perf-configs/oa-chv.xml           |  9757 ++++++++++++
 lib/i915/perf-configs/oa-cnl.xml           | 10411 ++++++++++++
 lib/i915/perf-configs/oa-glk.xml           |  9346 +++++++++++
 lib/i915/perf-configs/oa-hsw.xml           |  4615 ++++++
 lib/i915/perf-configs/oa-icl.xml           | 11869 ++++++++++++++
 lib/i915/perf-configs/oa-kblgt2.xml        | 10866 +++++++++++++
 lib/i915/perf-configs/oa-kblgt3.xml        | 10933 +++++++++++++
 lib/i915/perf-configs/oa-lkf.xml           | 11803 ++++++++++++++
 lib/i915/perf-configs/oa-sklgt2.xml        | 11895 ++++++++++++++
 lib/i915/perf-configs/oa-sklgt3.xml        | 10933 +++++++++++++
 lib/i915/perf-configs/oa-sklgt4.xml        | 10956 +++++++++++++
 lib/i915/perf-configs/oa-tgl.xml           |  8491 ++++++++++
 lib/i915/perf-configs/oa_guid_registry.py  |    73 +
 lib/i915/perf-configs/perf-codegen.py      |   850 +
 lib/i915/perf-configs/update-guids.py      |   231 +
 lib/i915/perf.c                            |   424 +
 lib/i915/perf.h                            |   227 +
 lib/meson.build                            |    65 +
 tools/i915-perf/i915_perf_configs.c        |   277 +
 tools/i915-perf/meson.build                |     5 +
 tools/meson.build                          |     1 +
 30 files changed, 172558 insertions(+)
 create mode 100644 lib/i915-perf.pc.in
 create mode 100644 lib/i915/perf-configs/README.md
 create mode 100644 lib/i915/perf-configs/codegen.py
 create mode 100644 lib/i915/perf-configs/guids.xml
 create mode 100755 lib/i915/perf-configs/mdapi-xml-convert.py
 create mode 100644 lib/i915/perf-configs/oa-bdw.xml
 create mode 100644 lib/i915/perf-configs/oa-bxt.xml
 create mode 100644 lib/i915/perf-configs/oa-cflgt2.xml
 create mode 100644 lib/i915/perf-configs/oa-cflgt3.xml
 create mode 100644 lib/i915/perf-configs/oa-chv.xml
 create mode 100644 lib/i915/perf-configs/oa-cnl.xml
 create mode 100644 lib/i915/perf-configs/oa-glk.xml
 create mode 100644 lib/i915/perf-configs/oa-hsw.xml
 create mode 100644 lib/i915/perf-configs/oa-icl.xml
 create mode 100644 lib/i915/perf-configs/oa-kblgt2.xml
 create mode 100644 lib/i915/perf-configs/oa-kblgt3.xml
 create mode 100644 lib/i915/perf-configs/oa-lkf.xml
 create mode 100644 lib/i915/perf-configs/oa-sklgt2.xml
 create mode 100644 lib/i915/perf-configs/oa-sklgt3.xml
 create mode 100644 lib/i915/perf-configs/oa-sklgt4.xml
 create mode 100644 lib/i915/perf-configs/oa-tgl.xml
 create mode 100644 lib/i915/perf-configs/oa_guid_registry.py
 create mode 100755 lib/i915/perf-configs/perf-codegen.py
 create mode 100755 lib/i915/perf-configs/update-guids.py
 create mode 100644 lib/i915/perf.c
 create mode 100644 lib/i915/perf.h
 create mode 100644 tools/i915-perf/i915_perf_configs.c
 create mode 100644 tools/i915-perf/meson.build

diff --git a/lib/i915-perf.pc.in b/lib/i915-perf.pc.in
new file mode 100644
index 00000000..e72efdc3
--- /dev/null
+++ b/lib/i915-perf.pc.in
@@ -0,0 +1,10 @@
+prefix=@prefix@
+exec_prefix=@exec_prefix@
+libdir=@libdir@
+includedir=@includedir@
+
+Name: i915-perf
+Description: i915 perf library
+Version: @version@
+Libs: -L${libdir} -li915_perf
+Cflags: -I${includedir}/i915-perf
diff --git a/lib/i915/perf-configs/README.md b/lib/i915/perf-configs/README.md
new file mode 100644
index 00000000..df31d6ae
--- /dev/null
+++ b/lib/i915/perf-configs/README.md
@@ -0,0 +1,115 @@
+# About guids.xml
+
+This is the authoritative registry of unique identifiers for different OA unit
+hardware configurations. Userspace can reliably use these identifiers to map a
+configuration to corresponding normalization equations and counter meta data.
+
+If a hardware configuration ever changes in a backwards incompatible way
+(changing the semantics and/or layout of the raw counters) then it must be
+given a new GUID.
+
+mdapi-xml-convert.py will match metric sets with a GUID from this file based on
+an md5 hash of the hardware register configuration and skip a metric set with a
+warning if no GUID could be found.
+
+All new metric sets need to be allocated a GUID here before
+mdapi-xml-convert.py or i915-perf-kernelgen.py will output anything for that
+metric set. This ensures we don't automatically import new metric sets without
+some explicit review that that's appropriate.
+
+A failure to find a GUID for an older metric set most likely implies that the
+register configuration was changed. It's possible that the change is benign
+(e.g. a comment change) and in that case the mdapi_config_hash for the
+corresponding metric set below can be updated.
+
+The update-guids.py script is the recommended way of managing updates to this
+file by generating a temporary file with proposed updates that you can compare
+with the current guids.xml.
+
+
+# update-guids.py
+
+update-guids.py can help with:
+
+* Recognising new metrics from VPG's MDAPI XML files
+
+  *(NOTE: new guids.xml entries will initially be missing the
+  config_hash=MD5_HASH attribute until mdapi-xml-convert.py is used to generate
+  a corresponding oa-*.xml config description)*
+
+* Adding a config_hash=MD5_HASH attribute to recently added guids.xml entries
+  after mdapi-xml-convert.py has been run.
+
+* Allocating a GUID for a custom metric that doesn't have a counterpart in
+  VPG's MDAPI XML files.
+
+  For this case you can add a stub entry with only a name like `<guid
+  name="Foo">` to guids.xml and then running update-guids.py will output a
+  corresponding line with the addition of an id=UUID attribute.
+
+
+# How to sync the oa-\*.xml files with latest internal MDAPI XML files
+
+1. E.g. copy a new `MetricsXML_BDW.xml` to `mdapi/MetricsXML_BDW.xml`
+
+*Note that the `mdapi-xml-convert.py` script will only convert configs that
+have a corresponding GUID entry within `guids.xml`. This check helps avoid
+unintentionally publishing early, work-in-progress/pre-production configs.*
+
+The `guids.xml` registry maps each complex OA unit register configuration to a
+unique ID that userspace can recognise and trust the semantics of raw counters
+read using that configuration. (Just for reference, this is particularly
+valuable for tools that capture raw metrics for later, offline processing since
+the IDs effectively provide a compressed description of how to interpret the
+data by providing an index into a database of high-level counter descriptions.)
+
+The registry associates each ID with a hash of the HW register config as found in
+MDAPI XML files ('mdapi_config_hash') and also with a hash of the HW config as
+found in oa-\*.xml files ('config_hash'). The hashes used for lookups in the
+registry also help detect when the register config for a pre-existing metric set
+is updated. Note: these hashes are only for the low-level hardware configuration
+so updates to counter descriptions used by frontend UIs won't affect indexing
+here.
+
+There is a chicken and egg situation when updating or adding new entries to
+guids.xml since we can't hash the configs in oa-\*.xml until successfully running
+mdapi-xml-convert.py which depends on a guids.xml registry entry first. The
+update-guids.py script will output registry entries without an oa-\*.xml config
+hash if not available and can be re-run after mdapi-xml-convert.py to add the
+missing hashes.
+
+2. Now run:
+```
+./update-guids.py --guids=guids.xml mdapi/MetricsXML_BDW.xml > guids.xml2
+```
+*(note the script expects to find oa-\*.xml files in the current directory)*
+
+Diff `guids.xml` and `guids.xml2` (easiest with a side-by-side diff editor) and
+review the registry changes. *Note: many lines will have a warning like `"Not
+found in MDAPI XML file[s]..."` if `update-guids.py` wasn't given all known
+MDAPI XML files but in this case they can be ignored for all non-BDW configs.*
+
+*Note: for any config that is already supported upstream in the i915 perf driver
+we need to be careful if the hash for a metric set changes in case the semantics
+for any raw counters were changed. The semantics of raw counters associated with
+a given GUID form part of the drm i915 perf uapi contract and must remain
+backwards compatible.*
+
+If the diff shows any `mdapi_config_hash` changes for pre-existing (especially
+upstream) configs you should review the MDAPI XML changes for the metric set and
+verify the change just relates to a bug fix. If more substantial changes were
+made, that could mean we need to treat it as a new config. Handling the latter
+case is left as an exercise to the reader, since it hasn't happened so far :-D.
+Assuming all the changes and new entries look good they can be copied into
+`guids.xml`, removing any trailing comment left by `update-guids.py`.
+
+3. Now run mdapi-xml-convert.py:
+```
+./mdapi-xml-convert.py --guids=guids.xml mdapi/MetricsXML_BDW.xml > oa-bdw.xml
+```
+
+4. We can now update new entries in guids.xml with a 'config_hash':
+```
+./update-guids.py --guids=guids.xml mdapi/MetricsXML_BDW.xml > guids.xml2
+```
+*(and again diff, check the changes and copy across)*
diff --git a/lib/i915/perf-configs/codegen.py b/lib/i915/perf-configs/codegen.py
new file mode 100644
index 00000000..0802547a
--- /dev/null
+++ b/lib/i915/perf-configs/codegen.py
@@ -0,0 +1,33 @@
+class Codegen:
+
+    _file = None
+    _indent = 0
+
+    endl="\n"
+    use_tabs = False
+
+    def __init__(self, filename = None):
+        if filename != None:
+            self._file = open(filename, 'w')
+
+    def __call__(self, *args):
+        if self._file:
+            code = ' '.join(map(str, args))
+            for line in code.splitlines():
+                indent = ''.rjust(self._indent)
+
+                if self.use_tabs:
+                    indent = indent.replace("        ", "\t")
+
+                text = indent + line
+                self._file.write(text.rstrip() + self.endl)
+
+    # Write the space-joined arguments as-is, without indentation or a trailing newline.
+    def frag(self, *args):
+        code = ' '.join(map(str, args))
+        self._file.write(code)
+
+    def indent(self, n):
+        self._indent = self._indent + n
+    def outdent(self, n):
+        self._indent = self._indent - n
diff --git a/lib/i915/perf-configs/guids.xml b/lib/i915/perf-configs/guids.xml
new file mode 100644
index 00000000..30ca0640
--- /dev/null
+++ b/lib/i915/perf-configs/guids.xml
@@ -0,0 +1,319 @@
+<!--
+    This is the authoritative registry of unique identifiers for different OA unit
+    hardware configurations. Userspace can reliably use these identifiers to
+    map a configuration to corresponding normalization equations and counter
+    meta data.
+
+    Most maintenance is done using the update-guids.py helper script to generate
+    a temporary guids.xml.update file which should then be manually compared with
+    a visual diff tool to cherry pick the final changes into guids.xml.
+
+    See README.md for more details.
+-->
+<guids>
+    <guid id="2f01b241-7014-42a7-9eb6-a925cad3daba" chipset="all" name="MDAPI" />
+    <guid config_hash="b96ab550dbb61fa1d1a98b2d6f938e9c" mdapi_config_hash="c675607e7d1b0083729e4b1621fd25f8" id="a490e9d2-55b3-4db0-8dab-53011032c5f3" chipset="hsw" name="RenderBasic" />
+    <guid config_hash="3b656e19962cf1990cfb253a59946266" mdapi_config_hash="09199618ca154304fd42ca5ee19187f4" id="b344c8cb-a291-4cbf-aa9c-b40213bfc96f" chipset="hsw" name="ComputeBasic" />
+    <guid config_hash="bb978ccd4f1eca6d7806f304a42fb10f" mdapi_config_hash="77524b565825e61259436f526848c1e1" id="480f9795-cf6a-4204-a9e3-cd7015515f8d" chipset="hsw" name="ComputeExtended" />
+    <guid config_hash="890e4b72a09b71cb9c4522fbd8f7e45a" mdapi_config_hash="28d4ec8839e660bac90c3fbfa815ce45" id="399d3001-97d6-4240-b065-4fb843138e17" chipset="hsw" name="MemoryReads" />
+    <guid config_hash="904374d80088ec4941ab3c1dbed1aac0" mdapi_config_hash="6a8cbc42da4822a17d3de385d6811c1a" id="f3c1ff4b-d0da-4ffa-8780-2c6b98f3f2d5" chipset="hsw" name="MemoryWrites" />
+    <guid config_hash="35111d939881fd8e2367f89f86b43d19" mdapi_config_hash="4f8c749ea23ece9349cf690908159b6b" id="e111cda4-19c3-41ee-b326-f99ac44ebf78" chipset="hsw" name="SamplerBalance" />
+    <guid mdapi_config_hash="3c2ee9a97141f36bc13828aeda30e477" id="ce81ddfb-573f-4100-8b9a-8dc93a5e5c8c" chipset="hsw" name="RenderBalance" />
+    <guid mdapi_config_hash="7ffc6e4d3d2284ea76e9390b0fd8aaf1" id="2fbbb85b-0f33-4aeb-9d92-35256de2662f" chipset="hsw" name="MemoryReadsOnWritePort" />
+    <guid mdapi_config_hash="ff6824b311096312105547bbe5e65758" id="a1476140-3af3-4556-b5fe-501e2df8b963" chipset="hsw" name="StencilPmaHold" />
+    <guid mdapi_config_hash="414afdc7b2570bbbe07406ec675f3040" id="b3d5350e-32ba-4c72-96c2-0a504e86eda3" chipset="hsw" name="MediaMemoryReads" />
+    <guid mdapi_config_hash="cf80117b63d376e87735b73e8f5ebc5b" id="69b42918-c915-439a-9e4b-a82fe3c9e1a3" chipset="hsw" name="MediaMemoryWrites" />
+    <guid mdapi_config_hash="3566f20e9e3707cb9aefccff3ead7572" id="18024740-aa68-4d25-877e-082c9fdcb895" chipset="hsw" name="MediaVmePipe" />
+    <guid config_hash="240f9cd7a6699b44ff0bf22b24449ac0" mdapi_config_hash="961180e14745136637cfd0253c6c0a63" id="d6de6f55-e526-4f79-a6a6-d7315c09044e" chipset="bdw" name="TestOa" />
+    <guid config_hash="9c4955c220cbcc5f9ff3ce6e7af64cf5" mdapi_config_hash="7f7918e87f574f62cc4e8d37f660abc5" id="b541bd57-0e0f-4154-b4c0-5858010a2bf7" chipset="bdw" name="RenderBasic" />
+    <guid config_hash="35d980685774e3631a7e5eb4d23a0013" mdapi_config_hash="ea406bf4dc4e4edd5e29cce12bef1778" id="35fbc9b2-a891-40a6-a38d-022bb7057552" chipset="bdw" name="ComputeBasic" />
+    <guid config_hash="d17b0801f998c4b119c63b0467e8f9b5" mdapi_config_hash="fbde7829568089b44b53a1eefbad9b0e" id="8fb61ba2-2fbb-454c-a136-2dec5a8a595e" chipset="bdw" name="ComputeExtra" />
+    <guid config_hash="1bb1be4885c0568bf0d3bd5df9fe4a7a" mdapi_config_hash="f0c3b043834e63d21ba6be573df02e32" id="233d0544-fff7-4281-8291-e02f222aff72" chipset="bdw" name="RenderPipeProfile" />
+    <guid config_hash="9147786065e1562d254a1dc82c14b4f9" mdapi_config_hash="fa121c59e98aa4f860c797bfab097cd7" id="2b255d48-2117-4fef-a8f7-f151e1d25a2c" chipset="bdw" name="MemoryReads" />
+    <guid config_hash="13cadf5e130b16bf6cf777e34ff54fcf" mdapi_config_hash="7e324f6f7cb980832735ada1e12f7905" id="f7fd3220-b466-4a4d-9f98-b0caf3f2394c" chipset="bdw" name="MemoryWrites" />
+    <guid config_hash="552b53f8d91428cec6eab6bff62ae8af" mdapi_config_hash="6ba093cf3feb68f521e579169ad689cf" id="e99ccaca-821c-4df9-97a7-96bdb7204e43" chipset="bdw" name="ComputeExtended" />
+    <guid config_hash="2cf68f22eadf4cb430a7e2a76fab3632" mdapi_config_hash="e9913c0dd30d6ccab98c5dec58dc7162" id="27a364dc-8225-4ecb-b607-d6f1925598d9" chipset="bdw" name="ComputeL3Cache" />
+    <guid config_hash="15d5387219cda641a8964b9edeb86b6d" mdapi_config_hash="fc357f19e2a77465c3232693f3bb1444" id="857fc630-2f09-4804-85f1-084adfadd5ab" chipset="bdw" name="DataPortReadsCoalescing" />
+    <guid config_hash="95a2d953682c60ee0213c41892067b94" mdapi_config_hash="be3980a5f0e6057e641b884fc56b07ff" id="343ebc99-4a55-414c-8c17-d8e259cf5e20" chipset="bdw" name="DataPortWritesCoalescing" />
+    <guid config_hash="9004a46b9728e0f12232ce8b151d3224" mdapi_config_hash="715fe2c431914b6b369970c0b897f7e2" id="e1743ca0-7fc8-410b-a066-de7bbb9280b7" chipset="bdw" name="VMEPipe" />
+    <guid config_hash="bb8d49db81e7bd822188ed5a958b4863" mdapi_config_hash="f94fd6ba5bfa83bb965705f1c69f1d37" id="78490af2-10fa-430b-ae3c-94ec04d5214e" chipset="bdw" name="HDCAndSF" />
+    <guid config_hash="19924ef1563f10e386755b531d44a3fb" mdapi_config_hash="a5589479b360f6d4f5c8f70fe78b0e1d" id="c0abdd97-3b13-4cad-814c-bd178804e02c" chipset="bdw" name="L3_1" />
+    <guid config_hash="41217f1f74d9e181726736ab9af57c32" mdapi_config_hash="0fc152bfbb920f90b16ed0445afe9e48" id="ad665281-a7cf-483a-bd10-0e07c43f61c7" chipset="bdw" name="L3_2" />
+    <guid config_hash="f17717dae4348688c670212b507d451a" mdapi_config_hash="2afc3cdd7ffbb021fc0ae99681b138ab" id="930a15aa-4300-4fce-a9ba-edb0b9e880be" chipset="bdw" name="L3_3" />
+    <guid config_hash="71232cf595afad2b53666f6c233447e8" mdapi_config_hash="032c9ab7c2c6d056da82e4ee1b159c18" id="d7793b26-b5e3-4f0f-ad78-7ebc9d0b4c7d" chipset="bdw" name="L3_4" />
+    <guid config_hash="b8a474b7965b6d9ec62641732d0d479b" mdapi_config_hash="b2454e1eef8d38d83cb95ba2b3d85431" id="da0f7875-1143-4d73-a39c-9128a951c46a" chipset="bdw" name="RasterizerAndPixelBackend" />
+    <guid config_hash="f8f05a9f4ce4bd928f1343180584f7de" mdapi_config_hash="6fb026e2926fbd3a507e55a7bf0a3687" id="52c186e4-39e3-4534-87cd-41bd47763df9" chipset="bdw" name="Sampler_1" />
+    <guid config_hash="30ee983d5ba223ad552acc3debc13c00" mdapi_config_hash="e38e63da0d875958bc88a9deb8d529ba" id="edcb8c31-764d-451a-9ecd-c9c89fb54f8d" chipset="bdw" name="Sampler_2" />
+    <guid config_hash="bbc70da24570ab578fb1416217fc0834" mdapi_config_hash="c905876bdf561cc26c64363ced258c64" id="729fc3f4-ccff-4902-be6b-f1a22cc92c02" chipset="bdw" name="TDL_1" />
+    <guid config_hash="803ca6eb4feef4090332003b65607c95" mdapi_config_hash="0000753d7f52fb3a0b0baa6b44052cff" id="29598975-4785-43ab-a981-1dfa58d0e835" chipset="bdw" name="TDL_2" />
+    <guid config_hash="c45ebb398888eabb889be632432550eb" mdapi_config_hash="a3c52d64b6d187b02de43af112abc509" id="0a9eb7be-feee-4275-a139-6d9cedf0fdb0" chipset="bdw" name="GpuBusyness" />
+    <guid config_hash="13a7f7de484592659ef4d346901bde25" mdapi_config_hash="59cd2454083f4855dca14637425d733c" id="e713f347-953e-4d8c-b02f-6be31df2db2b" chipset="bdw" name="STC_PmaStall" />
+    <guid config_hash="867e736ad8c49a9f4cd17b58f1b0b0cc" mdapi_config_hash="d996104bf7531170226275d44a3602b6" id="4a534b07-cba3-414d-8d60-874830e883aa" chipset="chv" name="TestOa" />
+    <guid config_hash="4fe7c53a36b24f621e11a1487d46e325" mdapi_config_hash="089852d3f5babff2175457f57214ce57" id="9d8a3af5-c02c-4a4a-b947-f1672469e0fb" chipset="chv" name="RenderBasic" />
+    <guid config_hash="6472c5788ff47d2f8f88b86b7314c09e" mdapi_config_hash="60375bf6570a28320cce512ab6d024e0" id="f522a89c-ecd1-4522-8331-3383c54af5f5" chipset="chv" name="ComputeBasic" />
+    <guid config_hash="532bafcf355d5812242ab50a362bf934" mdapi_config_hash="1466be3c679aeeb0627be174ead35e58" id="a9ccc03d-a943-4e6b-9cd6-13e063075927" chipset="chv" name="RenderPipeProfile" />
+    <guid config_hash="bb8d49db81e7bd822188ed5a958b4863" mdapi_config_hash="f94fd6ba5bfa83bb965705f1c69f1d37" id="33af8252-7a51-4aa3-b0ba-1b946f209d7b" chipset="chv" name="HDCAndSF" />
+    <guid config_hash="19924ef1563f10e386755b531d44a3fb" mdapi_config_hash="a5589479b360f6d4f5c8f70fe78b0e1d" id="78f52900-5317-4417-8067-966fbf215a1f" chipset="chv" name="L3_1" />
+    <guid config_hash="41217f1f74d9e181726736ab9af57c32" mdapi_config_hash="0fc152bfbb920f90b16ed0445afe9e48" id="0db4fe4a-2648-4064-bd6a-89c06d0c27b3" chipset="chv" name="L3_2" />
+    <guid config_hash="f17717dae4348688c670212b507d451a" mdapi_config_hash="2afc3cdd7ffbb021fc0ae99681b138ab" id="0de6539e-33b4-4aee-83c4-9ab45a579b94" chipset="chv" name="L3_3" />
+    <guid config_hash="71232cf595afad2b53666f6c233447e8" mdapi_config_hash="032c9ab7c2c6d056da82e4ee1b159c18" id="be74c9d6-268f-4d7f-b2e8-8d91d4441883" chipset="chv" name="L3_4" />
+    <guid config_hash="b8a474b7965b6d9ec62641732d0d479b" mdapi_config_hash="b2454e1eef8d38d83cb95ba2b3d85431" id="31bc1ff3-8d09-4497-9d79-59c4f943b502" chipset="chv" name="RasterizerAndPixelBackend" />
+    <guid config_hash="f8f05a9f4ce4bd928f1343180584f7de" mdapi_config_hash="6fb026e2926fbd3a507e55a7bf0a3687" id="05450fec-bb5c-4b0a-8995-e03631168a34" chipset="chv" name="Sampler_1" />
+    <guid config_hash="30ee983d5ba223ad552acc3debc13c00" mdapi_config_hash="e38e63da0d875958bc88a9deb8d529ba" id="883c8a56-8767-4de8-beec-a99462c6674b" chipset="chv" name="Sampler_2" />
+    <guid config_hash="bbc70da24570ab578fb1416217fc0834" mdapi_config_hash="c905876bdf561cc26c64363ced258c64" id="eb97e523-d9ac-48a9-b7f8-9cc909ddbf14" chipset="chv" name="TDL_1" />
+    <guid config_hash="803ca6eb4feef4090332003b65607c95" mdapi_config_hash="0000753d7f52fb3a0b0baa6b44052cff" id="dff6158e-8409-452c-be76-91c9946330bd" chipset="chv" name="TDL_2" />
+    <guid mdapi_config_hash="5cc4d10d745060d0672ffb4ebf0d1687" id="22480aac-b81a-40ce-8770-1061ce51dff7" chipset="chv" name="StencilPmaHold" />
+    <guid mdapi_config_hash="f3ae7e16e9b6aadac98179bc4c847246" id="f8315f64-668e-405e-a6d6-c52e4d9e8f1c" chipset="chv" name="MediaMemoryReads" />
+    <guid mdapi_config_hash="ea98859ab4afdda2589be697455c7dc8" id="6df9f4c3-4775-4f47-be6a-991fba7a02c7" chipset="chv" name="MediaMemoryWrites" />
+    <guid mdapi_config_hash="179e6a40c74a8401597b82383dacfd70" id="e7b839a6-6045-4ec7-aaa5-f6aab87a55aa" chipset="chv" name="MediaVmePipe" />
+    <guid mdapi_config_hash="3ed20c9f7071cef87fd28d2f899c9e6c" id="aa7d6b37-3e8f-46a4-ab50-e58f8efbdab9" chipset="chv" name="HdcUrbCoalescing" />
+    <guid mdapi_config_hash="b39b58578bb37520010084d2fb489c47" id="d991c4b4-7c8b-43a9-b187-7b143cb903cc" chipset="chv" name="L3" />
+    <guid mdapi_config_hash="36c6e4beda33281c27a79f4134ea9f80" id="531d4a91-df08-4dd4-8c5c-0158321a9ee0" chipset="chv" name="SamplerAndHDCAndTDL" />
+    <guid mdapi_config_hash="959a0f3d993feb51a3ce93ea3b61d726" id="ca514a15-e550-4277-ba52-b7cfa4929e25" chipset="chv" name="TDL" />
+    <guid mdapi_config_hash="f1232ea7b1a2bc5b0cfc7d640528e5b2" id="2a933a92-bddc-44dd-a06a-672391972b5e" chipset="chv" name="ComputeL3Cache" />
+    <guid config_hash="e018d083414e4d28e0ed481554128883" mdapi_config_hash="dce59e977ffff25a57f2486f5d9a7c60" id="5ee72f5c-092f-421e-8b70-225f7c3e9612" chipset="bxt" name="TestOa" />
+    <guid config_hash="203852243e7fde6887b1db92862d5eee" mdapi_config_hash="9bf85c8db90bbb173411dd8fbf2c9d90" id="22b9519a-e9ba-4c41-8b54-f4f8ca14fa0a" chipset="bxt" name="RenderBasic" />
+    <guid config_hash="cde046a01aba9c56d6fa44bf2c0f26c2" mdapi_config_hash="86794812560853ea5531d6eb816c7bfa" id="012d72cf-82a9-4d25-8ddf-74076fd30797" chipset="bxt" name="ComputeBasic" />
+    <guid config_hash="a19a55aad269ccc1ed4380314eda4bed" mdapi_config_hash="ac34c2028f3f4fae92e58aae1496901b" id="fa6ecf21-2cb8-4d0b-9308-6e4a7b4ca87a" chipset="bxt" name="ComputeExtra" />
+    <guid config_hash="1669463a6836f6d057cbf3e41506923b" mdapi_config_hash="c4b66b414f42b7e6f1b9941b445f79f2" id="ce416533-e49e-4211-80af-ec513590a914" chipset="bxt" name="RenderPipeProfile" />
+    <guid config_hash="f9eee3f0c9653ffd05e4876be0ea44d5" mdapi_config_hash="f707783ff8ea456ddc55fbaeb1a3bc0a" id="398e2452-18d7-42d0-b241-e4d0a9148ada" chipset="bxt" name="MemoryReads" />
+    <guid config_hash="03e840f1d8597b3c6c4015792243ce7d" mdapi_config_hash="b7e416688493d93c6a319a39c1c91fda" id="d324a0d6-7269-4847-a5c2-6f71ddc7fed5" chipset="bxt" name="MemoryWrites" />
+    <guid config_hash="39a03c065f1fdb5bf680207dc520cdb2" mdapi_config_hash="c90ecb54cbe7609fc6743f5273b68962" id="caf3596a-7bb1-4dec-b3b3-2a080d283b49" chipset="bxt" name="ComputeExtended" />
+    <guid config_hash="c241c2999f487dc995cecdb35b01197b" mdapi_config_hash="03f5a72e5e1ce82b6e3e14855298bf3d" id="49b956e2-d5b9-47e0-9d8a-cee5e8cec527" chipset="bxt" name="ComputeL3Cache" />
+    <guid config_hash="37dc8ae76c2554b11ecea682f1349ece" mdapi_config_hash="16b7f908edc7ee5ddb797c6fb1932fa6" id="ad9d9bc2-ccb7-4f5d-adbb-b4e67e615efd" chipset="bxt" name="HDCAndSF" />
+    <guid config_hash="543b9bdb10f681d516d8d9e2195221cd" mdapi_config_hash="87f92d7860a6674bf05428c26523755b" id="bde7b434-349c-4aad-8596-eb23c0352168" chipset="bxt" name="L3_1" />
+    <guid config_hash="1dc29cbbceb8e2e1a78d679ead80a27b" mdapi_config_hash="c7ec60f268b8efa00960e96dc9491517" id="f3d845e6-bfc3-4ffe-b0e5-dddc80c21f07" chipset="bxt" name="RasterizerAndPixelBackend" />
+    <guid config_hash="0b9e45ed32513193354be363e288b6a6" mdapi_config_hash="ad512c0f8b7457df8edca72ddea75e64" id="a53d620b-c14e-49df-bd27-e076b3fb98f3" chipset="bxt" name="Sampler" />
+    <guid config_hash="3f01b8d28fa285e7a496081574de4c1b" mdapi_config_hash="963e6d32bfe8cee347a8ae14d677c11c" id="8a44b172-6e1d-445f-8937-c06cc487ba39" chipset="bxt" name="TDL_1" />
+    <guid config_hash="0c77cba2d8886c18df9f382ce90eac66" mdapi_config_hash="a66f0092b99ca3a8ce29e0ce4be513ff" id="9d4643f8-aa05-482e-8193-070a8ab0d117" chipset="bxt" name="TDL_2" />
+    <guid config_hash="e6d52ba7af730de63eeaa8d727b36ed7" mdapi_config_hash="6898bc10a62600907cc6c47d1f7004a0" id="c9f5fa3a-d14f-400c-a89a-211206b00ee7" chipset="bxt" name="GpuBusyness" />
+    <guid config_hash="6d13f443205926fd1351ae5adeae8965" mdapi_config_hash="24f384a77963d7d64c324b3d89eeb498" id="d49cd0d8-8c7f-4465-94fc-51e08c9050bc" chipset="bxt" name="PMA_Stall" />
+    <guid config_hash="fc79f102b841df08ac154ddebc634bf6" mdapi_config_hash="3c97b92455702ca6f6a6f846dcc1ebd3" id="07b25942-d9fd-4fce-bd58-e29abd66b7de" chipset="sklgt2" name="RenderBasic" />
+    <guid config_hash="3e0e14aef4a2cf7e61098928c034caff" mdapi_config_hash="ecb641130c942e71d5a9de8adb51c7f6" id="00b80b4c-d215-4378-9015-da3dda3b61ea" chipset="sklgt2" name="ComputeBasic" />
+    <guid config_hash="d757768d43838dd04e2db7e9928c87d9" mdapi_config_hash="79c6baee9374a6c43b8e0fabda2c1a39" id="2a0c0933-37e7-427c-9951-ded42a78bb27" chipset="sklgt2" name="RenderPipeProfile" />
+    <guid config_hash="15938384237d1b01ceb07bc97edd12a9" mdapi_config_hash="22327f250c6079d5d5f9f1a70829dc05" id="246b35f1-44e0-4d03-8936-e452e291d064" chipset="sklgt2" name="MemoryReads" />
+    <guid config_hash="a0c0e0b3ad6e0960c9e3c626e9943c3b" mdapi_config_hash="5dcf9b09ab723e2f4ed17171a2b54a59" id="e0d3da02-00bf-4a96-9795-b48158c73a68" chipset="sklgt2" name="MemoryWrites" />
+    <guid config_hash="31bc9b67c237e4be9469d38ba69ec374" mdapi_config_hash="37e00c6654e34eaab18b6f3b2c606a16" id="c26b1fda-2752-4a33-a448-4c8718366846" chipset="sklgt2" name="ComputeExtended" />
+    <guid config_hash="a142f4714f9189816e129d2bf7ddd060" mdapi_config_hash="cdf98d85d93792dc203d2bfd7ae7559c" id="9fb22842-e708-43f7-9752-e0e41670c39e" chipset="sklgt2" name="ComputeL3Cache" />
+    <guid config_hash="977641d9cac7a2eb62c1c6cc844db2b5" mdapi_config_hash="a70cc632725191096cec1d685119aeb6" id="b4aa5e13-2d25-418f-827d-421f5cc4c43b" chipset="sklgt2" name="HDCAndSF" />
+    <guid config_hash="45aaf271f503f5d5d152b6d97c11412d" mdapi_config_hash="6b111ab20f6929a385eee8d283768ac1" id="504000e8-64f2-4aac-8301-51b81aa60d45" chipset="sklgt2" name="L3_1" />
+    <guid config_hash="6221743043a92819571c49bde5e09582" mdapi_config_hash="0b87bde0336f1d126527c9d8b0e6fa3c" id="f542479b-6685-4670-ad8e-9fe282a2eb5b" chipset="sklgt2" name="L3_2" />
+    <guid config_hash="b6320b7867895a125dec55805a8da286" mdapi_config_hash="7eae454eee816d64ff0fbb991ad4e9b9" id="1cbf1e9f-c2de-4cc2-8d1c-2c33c25a2332" chipset="sklgt2" name="L3_3" />
+    <guid config_hash="35f7405d36fe5767f4c1e80b322243d1" mdapi_config_hash="78b90bbcc0137b2c6e516cb32d44747c" id="b4e54cc8-a3a0-4ccd-9990-65d3184e5a38" chipset="sklgt2" name="RasterizerAndPixelBackend" />
+    <guid config_hash="6e2319f2ca15bfb049b2d1be6d1a0844" mdapi_config_hash="73ceeb4df0d124c61328ecf2c0207503" id="efe7eba4-fd9e-4a09-a92b-334970b5de57" chipset="sklgt2" name="Sampler" />
+    <guid config_hash="90eff0b1f381a2f187bd54f2047ce0f2" mdapi_config_hash="e0913ff09629a32c435487a69f6683b9" id="e9bd0bbb-c7b7-4a26-a27a-246987354776" chipset="sklgt2" name="TDL_1" />
+    <guid config_hash="c41684d2ccbe553874fb9cdbd8fd0229" mdapi_config_hash="6b1a9dc8dd375bf367313ad9b0531580" id="0a7accbf-8c55-455f-9984-23e9fb0b826d" chipset="sklgt2" name="TDL_2" />
+    <guid config_hash="483a06910590c1753a0266ef8b9f9b70" mdapi_config_hash="4be337ed83e3c95aebf66553ed685602" id="41a24047-7484-4ead-ae37-de907e5ff2b2" chipset="sklgt2" name="ComputeExtra" />
+    <guid config_hash="784698b7fb41dad7bc4bf13fac46657b" mdapi_config_hash="2fe32bdaf82fc66774ee95c33a23ea88" id="95910492-943f-44bd-9461-390240f243fd" chipset="sklgt2" name="VMEPipe" />
+    <guid config_hash="d2e36c07c43f128370fe1112d4de1181" mdapi_config_hash="d569893983ce055b9021b64420894431" id="1651949f-0ac0-4cb1-a06f-dafd74a407d1" chipset="sklgt2" name="TestOa" />
+    <guid config_hash="ee7996e47cdaf7722422397285763cdc" mdapi_config_hash="ada812fc71ebbabd1e746dbab67881b1" id="c44a5cf7-886d-477b-bebd-2d738923e4c3" chipset="sklgt2" name="GpuBusyness" />
+    <guid config_hash="cec6202194db96d6a09fed71808bb7de" mdapi_config_hash="df4b9b85ed61f457a0b71b03299b282d" id="e0b2aae4-9b8f-4211-8df0-f8e8cb203209" chipset="sklgt2" name="FfBottlenecks" />
+    <guid config_hash="8ae5bda74271c473f88f13e57d6f6828" mdapi_config_hash="e7f3f72cad542f3a17c09686e65487fc" id="27871149-2fa9-40ba-aa73-350d60c03a09" chipset="sklgt2" name="PMA_Stall" />
+    <guid config_hash="a7f1b241b23898785166ab10ca4ce1bf" mdapi_config_hash="ae3528402606bbb21a08da7ef5ea1530" id="21fef15a-83f4-4ffa-bb81-7da6e38b8e4b" chipset="sklgt3" name="RenderBasic" />
+    <guid config_hash="ede53df6549f788495f7fca90475b6dd" mdapi_config_hash="87390c127ce809c3cfab64388ddebd14" id="4320492b-fd03-42ac-922f-dbe1ef3b7b58" chipset="sklgt3" name="ComputeBasic" />
+    <guid config_hash="0f8eee02ed3e457362ffdc38ed10036c" mdapi_config_hash="2d95f03caa28b40e2a25f3bc8ac38b55" id="bd2d9cae-b9ec-4f5b-9d2f-934bed398a2d" chipset="sklgt3" name="RenderPipeProfile" />
+    <guid config_hash="0a75401250565ee5a0e555b47bc9e5b4" mdapi_config_hash="5218add4f4b16f3db5c92225871eb44c" id="4ca0f3fe-7fd3-4924-98cb-1807d9879767" chipset="sklgt3" name="MemoryReads" />
+    <guid config_hash="2ed5869dae575556e0895b0d0081555c" mdapi_config_hash="adc8e37f86eda900faf1fdb41f5dc3ee" id="a0c0172c-ee13-403d-99ff-2bdf6936cf14" chipset="sklgt3" name="MemoryWrites" />
+    <guid config_hash="6566c55fdf1de8ae73008029a674ecc9" mdapi_config_hash="f3ce984974a95b391e835b3a75aa7813" id="52435e0b-f188-42ea-8680-21a56ee20dee" chipset="sklgt3" name="ComputeExtended" />
+    <guid config_hash="f660e82bbeca0b5d2d31a98dac8eb940" mdapi_config_hash="7b6f81c79c79fb31b0fe5eea542e479f" id="27076eeb-49f3-4fed-8423-c66506005c63" chipset="sklgt3" name="ComputeL3Cache" />
+    <guid config_hash="2c6650c2422869aa2624b26f7a7c51bc" mdapi_config_hash="1ce5fbfd5db4183dfc3ab6bf4badfd59" id="a1b8363b-b986-47b6-929a-847afde3dec8" chipset="sklgt3" name="HDCAndSF" />
+    <guid config_hash="3ead5919c426a00ef6697e21df33ef07" mdapi_config_hash="269534866dc93d83e1e5934bd4900a89" id="fa857069-7f95-44c9-a3e0-cb8ccbc35abb" chipset="sklgt3" name="L3_1" />
+    <guid config_hash="2d0a88cdba58ddf18642fde563edb4d8" mdapi_config_hash="745f63effe3156a5f358999d45bd66c6" id="9830a5f3-a5e2-4773-a49d-6371407c382a" chipset="sklgt3" name="L3_2" />
+    <guid config_hash="d3972886309fa3701f3d3ae185f57cbe" mdapi_config_hash="b46614ab9a28c8a7fe88897cd72437bd" id="59452ceb-24bb-4878-87ec-87aab7b4f9db" chipset="sklgt3" name="L3_3" />
+    <guid config_hash="90ecbd5ae5ae6d3c0f756c7411351c85" mdapi_config_hash="7d797e538b84f6682caacdfb299145d9" id="d2249ff7-34b4-4203-b474-7c11546f9dae" chipset="sklgt3" name="RasterizerAndPixelBackend" />
+    <guid config_hash="5a628cbf246226c19fed41479cf17de1" mdapi_config_hash="1db0203064f7e2f8cb02901fe29a1d33" id="c9cf7c63-0065-4226-941e-98590bad8f75" chipset="sklgt3" name="Sampler" />
+    <guid config_hash="f48609e1a79093073b96726c3c4c63a6" mdapi_config_hash="781425b1a57e4ea0010105f565567161" id="e3bb1501-89ca-43fb-8668-9d96159e10a2" chipset="sklgt3" name="TDL_1" />
+    <guid config_hash="93ab6cf80fefdfca540a3ac101925411" mdapi_config_hash="66d2a4df7b3190be8bd9643e1cb14f99" id="29194a55-7e75-4152-a71f-ef34b1ae4cca" chipset="sklgt3" name="TDL_2" />
+    <guid config_hash="3ca2784da64d161a998b7d8f6d4e0235" mdapi_config_hash="5796dcc1e154e567d7758854bb621bcb" id="2d80a648-7b5a-4e92-bbe7-3b5c76f2e221" chipset="sklgt3" name="ComputeExtra" />
+    <guid config_hash="54b2a9ae72018dd99e63c2ecd9c92901" mdapi_config_hash="6ae821fe8ac78f4b387f9eec605ac900" id="cfae9232-6ffc-42cc-a703-9790016925f0" chipset="sklgt3" name="VMEPipe" />
+    <guid config_hash="cca1580576ffa8e25aa271ebdac68cc7" mdapi_config_hash="d05fe58178a1882edcb81d86070551e3" id="2b985803-d3c9-4629-8a4f-634bfecba0e8" chipset="sklgt3" name="TestOa" />
+    <guid config_hash="6124b939906bc3cda3621544aabfd890" mdapi_config_hash="24ef7b4026d1ac159bb663946df0e9b0" id="0c5058ff-fdf4-4e0d-81fb-c0310fb76525" chipset="sklgt3" name="GpuBusyness" />
+    <guid config_hash="8ae5bda74271c473f88f13e57d6f6828" mdapi_config_hash="4d9fb617c64406cc8b372808461dd3e3" id="c889fd93-8dc7-4ba5-9451-de34a8b5ea3f" chipset="sklgt3" name="PMA_Stall" />
+    <guid config_hash="0a80b2a2caa3386ecce110a7904eb1c1" mdapi_config_hash="61d002ce457b9ce087613d986e6b0544" id="95322a71-bb05-4437-bc27-f7dd7b27d136" chipset="sklgt4" name="RenderBasic" />
+    <guid config_hash="898ee42bb4b359d4c0eb97c5919cfd7f" mdapi_config_hash="d596d8f326e5378b871b825eb954e95c" id="7277228f-e7f3-4743-945a-6a2049d11377" chipset="sklgt4" name="ComputeBasic" />
+    <guid config_hash="48b5556f95fc27dceb10c65556a16613" mdapi_config_hash="95e3f2b556fe9795e0d0e0d3b0c5ee00" id="463c668c-3f60-49b6-8f85-d995b635b3b2" chipset="sklgt4" name="RenderPipeProfile" />
+    <guid config_hash="0a75401250565ee5a0e555b47bc9e5b4" mdapi_config_hash="d39a578cdf930d109c992f4abd7f83cb" id="3ae6e74c-72c3-4040-9bd0-7961430b8cc8" chipset="sklgt4" name="MemoryReads" />
+    <guid config_hash="2ed5869dae575556e0895b0d0081555c" mdapi_config_hash="603b987097b9d84c53eb55c60272b286" id="055f256d-4052-467c-8dec-6064a4806433" chipset="sklgt4" name="MemoryWrites" />
+    <guid config_hash="6566c55fdf1de8ae73008029a674ecc9" mdapi_config_hash="26c920eddaf1b7e2d58c37a96d4076bd" id="753972d4-87cd-4460-824d-754463ac5054" chipset="sklgt4" name="ComputeExtended" />
+    <guid config_hash="96d8e8d820ebad84b71c222f3c448ec5" mdapi_config_hash="182cd4a00f7a24a0c844bf9f8435419e" id="4e4392e9-8f73-457b-ab44-b49f7a0c733b" chipset="sklgt4" name="ComputeL3Cache" />
+    <guid config_hash="25ad6a99a2b00414d4747035af7fac94" mdapi_config_hash="f69a28470a231f8d0c20e3173274cf88" id="75f56991-b149-4122-ade9-d9c0c80c733b" chipset="sklgt4" name="HDCAndSF" />
+    <guid config_hash="3ead5919c426a00ef6697e21df33ef07" mdapi_config_hash="52b2279e32293bfe3cf97e443940215a" id="0d4cda70-da83-466f-b61e-7a064fe6a232" chipset="sklgt4" name="L3_1" />
+    <guid config_hash="2d0a88cdba58ddf18642fde563edb4d8" mdapi_config_hash="1541624f29b55f8abf422eaa813657e7" id="20137ace-b110-4341-883f-1094c820093c" chipset="sklgt4" name="L3_2" />
+    <guid config_hash="d3972886309fa3701f3d3ae185f57cbe" mdapi_config_hash="c734154b7a9bd205b8bfb176211873c3" id="d3a6b05e-46ef-44a8-96c3-9bd3e58acbe6" chipset="sklgt4" name="L3_3" />
+    <guid config_hash="90ecbd5ae5ae6d3c0f756c7411351c85" mdapi_config_hash="0fbb2b2f53429b0a25a6628c1fb21b32" id="4081b948-63f1-4b1a-abaa-6017cb77a63b" chipset="sklgt4" name="RasterizerAndPixelBackend" />
+    <guid config_hash="5a628cbf246226c19fed41479cf17de1" mdapi_config_hash="032dea8a40f7c0bbe2c9e0a238df248d" id="eae6bbb1-0e2b-478d-bd9e-f10ded2178f9" chipset="sklgt4" name="Sampler" />
+    <guid config_hash="f48609e1a79093073b96726c3c4c63a6" mdapi_config_hash="39a8e4da917b0874b8e697f203a641ff" id="1bba4bd2-81d4-45ec-847f-bc363e17e14d" chipset="sklgt4" name="TDL_1" />
+    <guid config_hash="93ab6cf80fefdfca540a3ac101925411" mdapi_config_hash="60b1253d54ce38bb6678d9a3eaa10305" id="a4b3106c-cfec-49f5-8e26-470470379e66" chipset="sklgt4" name="TDL_2" />
+    <guid config_hash="19cb1c38ee83566f630015215532efa5" mdapi_config_hash="f9ae90355e5abe786bf5e81f1c4222c0" id="a5aa857d-e8f0-4dfa-8981-ce340fa748fd" chipset="sklgt4" name="ComputeExtra" />
+    <guid config_hash="b28f9fef3bf5699c217d634bffa57fbc" mdapi_config_hash="cafc4d5abc6807434093d4f47fe83292" id="0e8d8b86-4ee7-4cdd-aaaa-58adc92cb29e" chipset="sklgt4" name="VMEPipe" />
+    <guid config_hash="cca1580576ffa8e25aa271ebdac68cc7" mdapi_config_hash="051007cbfaffa4151d7c9365edde7bff" id="882fa433-1f4a-4a67-a962-c741888fe5f5" chipset="sklgt4" name="TestOa" />
+    <guid config_hash="6124b939906bc3cda3621544aabfd890" mdapi_config_hash="24ef7b4026d1ac159bb663946df0e9b0" id="4e5b1599-5b01-4b3d-89fa-6b26a25fe02b" chipset="sklgt4" name="GpuBusyness" />
+    <guid config_hash="8ae5bda74271c473f88f13e57d6f6828" mdapi_config_hash="4d9fb617c64406cc8b372808461dd3e3" id="befe9fd6-474e-4a3d-b98e-cd793715cf91" chipset="sklgt4" name="PMA_Stall" />
+    <guid config_hash="afbe2cb999a8303f52eea075f3b8687e" mdapi_config_hash="966416aaaf33b0bce90c0daa51217242" id="99c1a40e-a090-4354-86e3-4d068bb1917e" chipset="kblgt2" name="RenderBasic" />
+    <guid config_hash="b1268f0f246efc7ab27f7637fa7193e8" mdapi_config_hash="c72d95bf362111446018c52210ec48b6" id="12994724-3a5a-4303-bb3c-ba0175d2c200" chipset="kblgt2" name="ComputeBasic" />
+    <guid config_hash="01f86f590b9b0c0371b0075a5e73b902" mdapi_config_hash="7ee27e7f11eea3282e62abde604b61a2" id="d7a17a3a-ca71-40d2-a919-ace80d50633f" chipset="kblgt2" name="RenderPipeProfile" />
+    <guid config_hash="0a75401250565ee5a0e555b47bc9e5b4" mdapi_config_hash="0779bba85f8be3baef98ecc5c66fd369" id="57b59202-172b-477a-87de-33f85572c589" chipset="kblgt2" name="MemoryReads" />
+    <guid config_hash="2ed5869dae575556e0895b0d0081555c" mdapi_config_hash="26eb749438ad7d42e34342048c1019c5" id="3addf8ef-8e9b-40f5-a448-3dbb5d5128b0" chipset="kblgt2" name="MemoryWrites" />
+    <guid config_hash="6566c55fdf1de8ae73008029a674ecc9" mdapi_config_hash="aa2dd4e7d446e3ce29dfeaf8f393243e" id="4af0400a-81c3-47db-a6b6-deddbd75680e" chipset="kblgt2" name="ComputeExtended" />
+    <guid config_hash="33bdd2160049aa831e025e1be7a453c5" mdapi_config_hash="2770df840fca647230d55b79f686ae11" id="0e22f995-79ca-4f67-83ab-e9d9772488d8" chipset="kblgt2" name="ComputeL3Cache" />
+    <guid config_hash="5736948ed298fd6e8cc80222e1e03077" mdapi_config_hash="c056251351b0b1f5beb4f6863484854b" id="fb149d66-fad2-4230-b0d7-4d689b9116d3" chipset="kblgt2" name="HDCAndSF" />
+    <guid config_hash="3ead5919c426a00ef6697e21df33ef07" mdapi_config_hash="17d38bff109de8e5622ff29bead0bbcf" id="f889f8cc-4c93-4ac8-b75f-551c0b9b87f7" chipset="kblgt2" name="L3_1" />
+    <guid config_hash="2d0a88cdba58ddf18642fde563edb4d8" mdapi_config_hash="1a88f6816aea2c42dae9f10d4233cb74" id="6d344efd-8e9e-42d4-a29e-1011c29f82c2" chipset="kblgt2" name="L3_2" />
+    <guid config_hash="d3972886309fa3701f3d3ae185f57cbe" mdapi_config_hash="ae28a594b1a6fd3864272da8dbe873f5" id="e3b386ae-c195-47d5-af29-8a1afa0ae2bf" chipset="kblgt2" name="L3_3" />
+    <guid config_hash="90ecbd5ae5ae6d3c0f756c7411351c85" mdapi_config_hash="d1b2421e43a489ffcdfeeaf271b2f12f" id="f9954679-a055-4862-9f57-9d66e3ebf81c" chipset="kblgt2" name="RasterizerAndPixelBackend" />
+    <guid config_hash="5a628cbf246226c19fed41479cf17de1" mdapi_config_hash="8d5f977be4f4d21e97e9e67786958495" id="4ed5e27e-fd1a-4f11-ad8f-9374e128c697" chipset="kblgt2" name="Sampler" />
+    <guid config_hash="f48609e1a79093073b96726c3c4c63a6" mdapi_config_hash="cbef2ea0f1c6e30bd37cea22a87e8373" id="9eaf384d-8f53-41b8-a71d-108308780fbc" chipset="kblgt2" name="TDL_1" />
+    <guid config_hash="93ab6cf80fefdfca540a3ac101925411" mdapi_config_hash="b685ab8fe6fc020e85f189f55fdf6e05" id="a00cbdf2-eabd-4240-9a89-86e2ac1ca1e4" chipset="kblgt2" name="TDL_2" />
+    <guid config_hash="483a06910590c1753a0266ef8b9f9b70" mdapi_config_hash="4be337ed83e3c95aebf66553ed685602" id="aa7a3fb9-22fb-43ff-a32d-0ab6c13bbd16" chipset="kblgt2" name="ComputeExtra" />
+    <guid config_hash="784698b7fb41dad7bc4bf13fac46657b" mdapi_config_hash="2fe32bdaf82fc66774ee95c33a23ea88" id="398a4268-ef6f-4ffc-b55f-3c7b5363ce61" chipset="kblgt2" name="VMEPipe" />
+    <guid config_hash="cca1580576ffa8e25aa271ebdac68cc7" mdapi_config_hash="5f4afc2f159098e96b8fd90a85979ae3" id="baa3c7e4-52b6-4b85-801e-465a94b746dd" chipset="kblgt2" name="TestOa" />
+    <guid config_hash="d36b63d76294172be0ad5e6530109d06" mdapi_config_hash="aa4c1ab961a066b0bc98bf914735b6af" id="6c66fe6e-2988-454a-bfae-7fca3bbcbec2" chipset="kblgt2" name="GpuBusyness" />
+    <guid config_hash="8ae5bda74271c473f88f13e57d6f6828" mdapi_config_hash="4d9fb617c64406cc8b372808461dd3e3" id="b49aa434-4958-4d98-9e6f-443ff27ca74d" chipset="kblgt2" name="PMA_Stall" />
+    <guid config_hash="73805d7acd1298aa6d81d3e2278ee411" mdapi_config_hash="9111e46468492c1c14a331510c18a49b" id="17b4f3e0-d578-4ae3-b7a8-98d756d1e0df" chipset="kblgt3" name="RenderBasic" />
+    <guid config_hash="b1268f0f246efc7ab27f7637fa7193e8" mdapi_config_hash="ac97e9ebaf2a55476a86ab2559e5ecab" id="a5dc0bc5-d6fa-4f3a-9979-d3248c786042" chipset="kblgt3" name="ComputeBasic" />
+    <guid config_hash="01f86f590b9b0c0371b0075a5e73b902" mdapi_config_hash="808e46d786103380f58d1e8f91402c4c" id="c7c735f3-ce58-45cf-aa04-30b183f1faff" chipset="kblgt3" name="RenderPipeProfile" />
+    <guid config_hash="0a75401250565ee5a0e555b47bc9e5b4" mdapi_config_hash="f810d7343822b3a3b9e50820708bfcb3" id="96ec2219-040b-428a-856a-6bc03363a057" chipset="kblgt3" name="MemoryReads" />
+    <guid config_hash="2ed5869dae575556e0895b0d0081555c" mdapi_config_hash="af6cd36da93a8ec66d57ba6b504b601f" id="03372b64-4996-4d3b-aa18-790e75eeb9c2" chipset="kblgt3" name="MemoryWrites" />
+    <guid config_hash="6566c55fdf1de8ae73008029a674ecc9" mdapi_config_hash="c4d070800ff5b65caff35d40adb52d04" id="31b4ce5a-bd61-4c1f-bb5d-f2e731412150" chipset="kblgt3" name="ComputeExtended" />
+    <guid config_hash="33bdd2160049aa831e025e1be7a453c5" mdapi_config_hash="dcedeef0d1a6b20eaa3f3ee546b048ed" id="2ce0911a-27fc-4887-96f0-11084fa807c3" chipset="kblgt3" name="ComputeL3Cache" />
+    <guid config_hash="c8739d6465605b9228ec2ff3ebde2ba3" mdapi_config_hash="3a893043b806be4b00179663f8f4695e" id="b128f45f-bfa2-4991-aadc-05be7898e398" chipset="kblgt3" name="HDCAndSF" />
+    <guid config_hash="3ead5919c426a00ef6697e21df33ef07" mdapi_config_hash="b97b4654b688f69b1df22e7d9cd08f2b" id="f3566b55-9c13-47bf-8327-4a887af75262" chipset="kblgt3" name="L3_1" />
+    <guid config_hash="2d0a88cdba58ddf18642fde563edb4d8" mdapi_config_hash="f8870bc48196bdc7c3d08bf0dba3e377" id="7b21aa68-9076-4ab4-8a84-e45a06c8eac6" chipset="kblgt3" name="L3_2" />
+    <guid config_hash="d3972886309fa3701f3d3ae185f57cbe" mdapi_config_hash="2091a23cf2f835375430e16328f73c7b" id="71b4b9dd-ae28-48ce-9a1a-5431e1f23afd" chipset="kblgt3" name="L3_3" />
+    <guid config_hash="90ecbd5ae5ae6d3c0f756c7411351c85" mdapi_config_hash="6c748481e5e43019bbeb0557c309b65e" id="52c646ca-52da-4853-877e-8645e73ed330" chipset="kblgt3" name="RasterizerAndPixelBackend" />
+    <guid config_hash="5a628cbf246226c19fed41479cf17de1" mdapi_config_hash="c1ea12cf95f7c8be3ca32c6670c15a27" id="c4bb682f-677c-4875-990b-005230be87b4" chipset="kblgt3" name="Sampler" />
+    <guid config_hash="f48609e1a79093073b96726c3c4c63a6" mdapi_config_hash="20f9812e7c1c94a2b24dbb6a0596b5e1" id="ade8521b-5e72-45d4-8c25-d9f0da774899" chipset="kblgt3" name="TDL_1" />
+    <guid config_hash="93ab6cf80fefdfca540a3ac101925411" mdapi_config_hash="25e39a0a38a1fdbf4e2ff677aad30fc6" id="9df2815d-4e9e-417f-bde1-3788dc6e1ea1" chipset="kblgt3" name="TDL_2" />
+    <guid config_hash="f543908db2541ef48f35603e35c379bd" mdapi_config_hash="41ebe4b58e504d63d60141faa9d45c18" id="efc497ac-884e-4ee4-a4a8-15fba22aaf21" chipset="kblgt3" name="ComputeExtra" />
+    <guid config_hash="16c6718fd82aaa5e1187df8d88ace152" mdapi_config_hash="d0ce6de1ad831394a048015990e82864" id="bfd9764d-2c5b-4c16-bfc1-89de3ca10917" chipset="kblgt3" name="VMEPipe" />
+    <guid config_hash="cca1580576ffa8e25aa271ebdac68cc7" mdapi_config_hash="817cb7526b5399e772ed721e062325b3" id="f1792f32-6db2-4b50-b4b2-557128f1688d" chipset="kblgt3" name="TestOa" />
+    <guid config_hash="de8530fdc36d260415e78771e8cc6929" mdapi_config_hash="3f82064fe17d6d7005b6e5c4bb828c5a" id="b55ecba1-2aa9-422e-89ff-b9e30f03d447" chipset="kblgt3" name="GpuBusyness" />
+    <guid config_hash="8ae5bda74271c473f88f13e57d6f6828" mdapi_config_hash="4d9fb617c64406cc8b372808461dd3e3" id="85bc2e4f-2563-4388-921b-dc0dad879cf3" chipset="kblgt3" name="PMA_Stall" />
+    <guid config_hash="c01efa1ec2a11ea9aaab8b0a8e548174" mdapi_config_hash="7867725687bd177e4e8b8b8443b04355" id="d72df5c7-5b4a-4274-a43f-00b0fd51fc68" chipset="glk" name="RenderBasic" />
+    <guid config_hash="cde046a01aba9c56d6fa44bf2c0f26c2" mdapi_config_hash="84d270fda538f1061067316b19b9cac9" id="814285f6-354d-41d2-ba49-e24e622714a0" chipset="glk" name="ComputeBasic" />
+    <guid config_hash="1669463a6836f6d057cbf3e41506923b" mdapi_config_hash="66b8f785edc91d1cf3952fc842114671" id="07d397a6-b3e6-49f6-9433-a4f293d55978" chipset="glk" name="RenderPipeProfile" />
+    <guid config_hash="f9eee3f0c9653ffd05e4876be0ea44d5" mdapi_config_hash="1056f30306a4c2d08d57e4faa86f983a" id="1a356946-5428-450b-a2f0-89f8783a302d" chipset="glk" name="MemoryReads" />
+    <guid config_hash="03e840f1d8597b3c6c4015792243ce7d" mdapi_config_hash="3a432ab2a6296f25755c1846385fae55" id="5299be9d-7a61-4c99-9f81-f87e6c5aaca9" chipset="glk" name="MemoryWrites" />
+    <guid config_hash="39a03c065f1fdb5bf680207dc520cdb2" mdapi_config_hash="ed01dd3479766a5fb38dd8e9e064786e" id="bc9bcff2-459a-4cbc-986d-a84b077153f3" chipset="glk" name="ComputeExtended" />
+    <guid config_hash="c241c2999f487dc995cecdb35b01197b" mdapi_config_hash="3a74134eedb02e201197da17e0940351" id="88ec931f-5b4a-453a-9db6-a61232b6143d" chipset="glk" name="ComputeL3Cache" />
+    <guid config_hash="37dc8ae76c2554b11ecea682f1349ece" mdapi_config_hash="fd61133e8762cb61d142a12604442177" id="0329ea02-ebb8-43f1-bf89-c5bdcccd3eb4" chipset="glk" name="HDCAndSF" />
+    <guid config_hash="d159b7f14e97660ae2887e4b610d2721" mdapi_config_hash="fe48f1232b010e9d10ab1bff0e6efb75" id="5e57a25a-1d18-4e94-b84b-08ea66751b8c" chipset="glk" name="L3_1" />
+    <guid config_hash="1dc29cbbceb8e2e1a78d679ead80a27b" mdapi_config_hash="2a635538209cc68b2c489d2326017539" id="f0652373-d361-426f-b36d-9ffec288bdc6" chipset="glk" name="RasterizerAndPixelBackend" />
+    <guid config_hash="0b9e45ed32513193354be363e288b6a6" mdapi_config_hash="593e37453b96243ac7752d9c45672c63" id="6ac97d12-ce13-428a-b20c-6902bde2608b" chipset="glk" name="Sampler" />
+    <guid config_hash="3f01b8d28fa285e7a496081574de4c1b" mdapi_config_hash="af87c7792e604a645dacdadb99c4afd2" id="59ea703a-9a35-4aed-a985-0d9ab7aceaba" chipset="glk" name="TDL_1" />
+    <guid config_hash="0c77cba2d8886c18df9f382ce90eac66" mdapi_config_hash="2e2beadb54378ff4d79bf4cf15bffd90" id="f2d6d718-e7b1-48f4-9624-45230d2fe2a0" chipset="glk" name="TDL_2" />
+    <guid config_hash="a19a55aad269ccc1ed4380314eda4bed" mdapi_config_hash="ac34c2028f3f4fae92e58aae1496901b" id="15274c82-27d2-4819-876a-7cb1a2c59ba4" chipset="glk" name="ComputeExtra" />
+    <guid config_hash="e018d083414e4d28e0ed481554128883" mdapi_config_hash="dce59e977ffff25a57f2486f5d9a7c60" id="dd3fd789-e783-4204-8cd0-b671bbccb0cf" chipset="glk" name="TestOa" />
+    <guid config_hash="6d13f443205926fd1351ae5adeae8965" mdapi_config_hash="24f384a77963d7d64c324b3d89eeb498" id="e6868953-fb47-431d-a060-f785916558fc" chipset="glk" name="PMA_Stall" />
+    <guid config_hash="afbe2cb999a8303f52eea075f3b8687e" mdapi_config_hash="8e8f1f5eb1b0a95dada8e3ddd78f4dd8" id="7fa796a4-0c7a-4201-afc6-cff0b2f528a2" chipset="cflgt2" name="RenderBasic" />
+    <guid config_hash="b1268f0f246efc7ab27f7637fa7193e8" mdapi_config_hash="87718bbf001284c0ca7c0e8060ebe6c6" id="a4985100-5f76-4822-8ca7-67908cb26274" chipset="cflgt2" name="ComputeBasic" />
+    <guid config_hash="01f86f590b9b0c0371b0075a5e73b902" mdapi_config_hash="f9a35b936db9a2f76b69d7b5bd5d10ec" id="2221e4d5-ed7b-445e-b2cc-3de1b97f4d42" chipset="cflgt2" name="RenderPipeProfile" />
+    <guid config_hash="0a75401250565ee5a0e555b47bc9e5b4" mdapi_config_hash="8b1e5617e61646d7d7d0361107ec2b67" id="82096a90-e2fa-4f38-ac14-562b2496933a" chipset="cflgt2" name="MemoryReads" />
+    <guid config_hash="2ed5869dae575556e0895b0d0081555c" mdapi_config_hash="2cd637a11aacc15af119c9dba70c5f1d" id="9f638880-02e9-4a8d-896a-7670a3bf0d35" chipset="cflgt2" name="MemoryWrites" />
+    <guid config_hash="6566c55fdf1de8ae73008029a674ecc9" mdapi_config_hash="5311aa266d0d85e7b67695731408ec3e" id="8d4ad934-7c16-43d5-845a-51067a4c8e2f" chipset="cflgt2" name="ComputeExtended" />
+    <guid config_hash="33bdd2160049aa831e025e1be7a453c5" mdapi_config_hash="019cd29f8fe235d7dca74e7860dafc08" id="4389cf07-1424-4963-b2d2-64fcec75406d" chipset="cflgt2" name="ComputeL3Cache" />
+    <guid config_hash="5736948ed298fd6e8cc80222e1e03077" mdapi_config_hash="4118768c8cfd35668067034b646a99ea" id="ac544b3a-ff78-46ea-9808-ee6fef0978b4" chipset="cflgt2" name="HDCAndSF" />
+    <guid config_hash="3ead5919c426a00ef6697e21df33ef07" mdapi_config_hash="fe8bb34c7f8bb873a55e7b7046ec4507" id="a35c5867-0ab8-4d45-8fc1-eb0906f0eff5" chipset="cflgt2" name="L3_1" />
+    <guid config_hash="2d0a88cdba58ddf18642fde563edb4d8" mdapi_config_hash="d4b1fe90832f2ab808b5dc6d6f2de431" id="bb4bcce9-2cbb-4818-9e49-67ce2c99cd25" chipset="cflgt2" name="L3_2" />
+    <guid config_hash="d3972886309fa3701f3d3ae185f57cbe" mdapi_config_hash="0a733ec395a9f95c9a4c7a53639352aa" id="9e1229f8-d87f-4f44-b067-3544e17195aa" chipset="cflgt2" name="L3_3" />
+    <guid config_hash="90ecbd5ae5ae6d3c0f756c7411351c85" mdapi_config_hash="86e99a03089772a7bff973a24bbcb21f" id="3e91908a-1c70-4004-b2ab-a10ef14f24f9" chipset="cflgt2" name="RasterizerAndPixelBackend" />
+    <guid config_hash="5a628cbf246226c19fed41479cf17de1" mdapi_config_hash="07cab9aa8c9c07b346ce2e8976ef87fa" id="9a6ba957-7955-4a09-a8ce-083030ba3c1f" chipset="cflgt2" name="Sampler" />
+    <guid config_hash="f48609e1a79093073b96726c3c4c63a6" mdapi_config_hash="8e2985ac9a60942987f94a397bfeb2ff" id="c54e7ca3-c60c-4396-ac3d-f9899c9a6ee4" chipset="cflgt2" name="TDL_1" />
+    <guid config_hash="93ab6cf80fefdfca540a3ac101925411" mdapi_config_hash="775f1d07ed4d225976adf356e8dc9df5" id="e438cd5d-1da7-46c6-9823-4780f370d11d" chipset="cflgt2" name="TDL_2" />
+    <guid config_hash="483a06910590c1753a0266ef8b9f9b70" mdapi_config_hash="4be337ed83e3c95aebf66553ed685602" id="5f679fb0-909e-4c0e-b4b2-8e801f83e71b" chipset="cflgt2" name="ComputeExtra" />
+    <guid config_hash="784698b7fb41dad7bc4bf13fac46657b" mdapi_config_hash="2fe32bdaf82fc66774ee95c33a23ea88" id="0d09ba9a-1d1c-457d-83e2-74ac448014d6" chipset="cflgt2" name="VMEPipe" />
+    <guid config_hash="d36b63d76294172be0ad5e6530109d06" mdapi_config_hash="aa4c1ab961a066b0bc98bf914735b6af" id="e2f162ae-5732-4af0-8b11-69510f57094a" chipset="cflgt2" name="GpuBusyness" />
+    <guid config_hash="cca1580576ffa8e25aa271ebdac68cc7" mdapi_config_hash="5f4afc2f159098e96b8fd90a85979ae3" id="74fb4902-d3d3-4237-9e90-cbdc68d0a446" chipset="cflgt2" name="TestOa" />
+    <guid config_hash="8ae5bda74271c473f88f13e57d6f6828" mdapi_config_hash="4d9fb617c64406cc8b372808461dd3e3" id="5ccbf9fb-6bf2-456b-a749-bdff7b1aff13" chipset="cflgt2" name="PMA_Stall" />
+    <guid config_hash="73805d7acd1298aa6d81d3e2278ee411" mdapi_config_hash="5d3d4bcf1e36569409cfd84a7e137ade" id="b316bcab-212f-4228-97de-af6b5a1a2ea1" chipset="cflgt3" name="RenderBasic" />
+    <guid config_hash="b1268f0f246efc7ab27f7637fa7193e8" mdapi_config_hash="4a9628256274ffe348e8dc21f0f22f3b" id="d2eec5b1-4dd8-4170-ae83-9531abd0692f" chipset="cflgt3" name="ComputeBasic" />
+    <guid config_hash="01f86f590b9b0c0371b0075a5e73b902" mdapi_config_hash="498feca145a69e7fcec55b79d239d005" id="9875e050-b1bc-45e6-a6ab-665594601df9" chipset="cflgt3" name="RenderPipeProfile" />
+    <guid config_hash="0a75401250565ee5a0e555b47bc9e5b4" mdapi_config_hash="610a6fcb593c50362beb8c0e2172685a" id="49c65f34-e625-4ca4-86b7-88693e624d4c" chipset="cflgt3" name="MemoryReads" />
+    <guid config_hash="2ed5869dae575556e0895b0d0081555c" mdapi_config_hash="d3b21fcad90e080ef31d74b9ebd6f9ba" id="45c9e8ee-2998-4d83-88e8-9cb7e03287bf" chipset="cflgt3" name="MemoryWrites" />
+    <guid config_hash="6566c55fdf1de8ae73008029a674ecc9" mdapi_config_hash="7c26cd39edceac6865beb355592d2bea" id="bac415ce-d7a2-4f8d-9b16-834deba7330e" chipset="cflgt3" name="ComputeExtended" />
+    <guid config_hash="33bdd2160049aa831e025e1be7a453c5" mdapi_config_hash="1013698045cad3a9935f5cd76ceb8331" id="a8cfca44-0e74-4338-9e57-3daad98957dd" chipset="cflgt3" name="ComputeL3Cache" />
+    <guid config_hash="c8739d6465605b9228ec2ff3ebde2ba3" mdapi_config_hash="6c4d2ca081899cddb7c730b7c9e11b35" id="c4bee67c-0de6-4bc2-9900-5388dcc8adca" chipset="cflgt3" name="HDCAndSF" />
+    <guid config_hash="3ead5919c426a00ef6697e21df33ef07" mdapi_config_hash="74d87a1c8c2eb43fc0d481a88e635cc4" id="2f77a650-54a6-4777-98dc-e49000c13ceb" chipset="cflgt3" name="L3_1" />
+    <guid config_hash="2d0a88cdba58ddf18642fde563edb4d8" mdapi_config_hash="e2ccd67d442ca19acc63a9b3556ce2cb" id="61cf6b31-9ddd-4deb-bae5-7339dd1f63b3" chipset="cflgt3" name="L3_2" />
+    <guid config_hash="d3972886309fa3701f3d3ae185f57cbe" mdapi_config_hash="fda9efbaddee05cf0c58b0b5ba63267a" id="1421ea8b-a4c9-4383-922a-60ba96c42f24" chipset="cflgt3" name="L3_3" />
+    <guid config_hash="90ecbd5ae5ae6d3c0f756c7411351c85" mdapi_config_hash="04d6c2564113599d8375138bcf87e0a5" id="6e1f0a90-c65f-4da9-86d0-c79b3c0063f6" chipset="cflgt3" name="RasterizerAndPixelBackend" />
+    <guid config_hash="5a628cbf246226c19fed41479cf17de1" mdapi_config_hash="9aa750e153f190ac1aeb54a87f778c8f" id="7cb05eab-0857-4189-93bc-09326d298637" chipset="cflgt3" name="Sampler" />
+    <guid config_hash="f48609e1a79093073b96726c3c4c63a6" mdapi_config_hash="88333263dd73a05cb7df643794d2eefa" id="05a06d02-0c12-486b-bb1d-9be053848980" chipset="cflgt3" name="TDL_1" />
+    <guid config_hash="93ab6cf80fefdfca540a3ac101925411" mdapi_config_hash="6750a43049c53c8cb8f966764bf7cf8f" id="cddbd1dc-41a2-4fe4-8b05-3d2773120814" chipset="cflgt3" name="TDL_2" />
+    <guid config_hash="f543908db2541ef48f35603e35c379bd" mdapi_config_hash="e3197d98aa86acaf090f1bffde854586" id="e61ae394-9d9e-4204-a735-1dad7e44d953" chipset="cflgt3" name="ComputeExtra" />
+    <guid config_hash="16c6718fd82aaa5e1187df8d88ace152" mdapi_config_hash="d0ce6de1ad831394a048015990e82864" id="94272ad9-45ee-4e34-b7a7-51546cd6405c" chipset="cflgt3" name="VMEPipe" />
+    <guid config_hash="de8530fdc36d260415e78771e8cc6929" mdapi_config_hash="3f82064fe17d6d7005b6e5c4bb828c5a" id="22b7e0c2-cade-425f-b099-34479768c72a" chipset="cflgt3" name="GpuBusyness" />
+    <guid config_hash="cca1580576ffa8e25aa271ebdac68cc7" mdapi_config_hash="228710e94277d74bd4be0c2536a3edd4" id="577e8e2c-3fa0-4875-8743-3538d585e3b0" chipset="cflgt3" name="TestOa" />
+    <guid config_hash="8ae5bda74271c473f88f13e57d6f6828" mdapi_config_hash="4d9fb617c64406cc8b372808461dd3e3" id="c11af8d1-858b-4f8b-98fb-8d683ba8bda0" chipset="cflgt3" name="PMA_Stall" />
+    <guid config_hash="428ad0859c9dac4ba85dd73106f5b2de" mdapi_config_hash="7baf473e87d0838b628bd2ed289f4783" id="2d975e19-7130-41d2-b06f-79d74f91e7c8" chipset="cnl" name="RenderBasic" />
+    <guid config_hash="7365cff2873ed22304dcb350ca19d834" mdapi_config_hash="174f9ff2125d06a7886a258304ba4eae" id="eed14f91-5f03-4e3a-8281-ac38030ac573" chipset="cnl" name="ComputeBasic" />
+    <guid config_hash="1878c620a9f0cc5100fba47c83a1457c" mdapi_config_hash="f1baa55e099488db74fd02c9560df40b" id="0666ccac-f5aa-4dc2-aa12-c6e058f383f3" chipset="cnl" name="RenderPipeProfile" />
+    <guid config_hash="10d83436d03f71bc19e6b83739072556" mdapi_config_hash="7f0796f55071a69b76c0a0615b2171e6" id="3500dcfd-837b-4ec8-b5cf-fe58b966263f" chipset="cnl" name="MemoryReads" />
+    <guid config_hash="e1c4bd09bd777f97d6c6491bf921ec6b" mdapi_config_hash="92754b4c69ef3427efdee08033daf7e2" id="63d18ead-3cfc-4972-a640-5e98b688dfee" chipset="cnl" name="MemoryWrites" />
+    <guid config_hash="01c5575fa201196b2a4b708001ef810f" mdapi_config_hash="f7fc9c2349a53c37bd020660a0990356" id="1b4d1280-6bbd-4d57-90c6-a03ed6059688" chipset="cnl" name="ComputeExtended" />
+    <guid config_hash="21c0efc6587cd42844e23251b3712b72" mdapi_config_hash="c3d136f1cda81821d08595bc4c29973a" id="f3b31b5a-00b3-4fb4-81fd-6446e505534c" chipset="cnl" name="ComputeL3Cache" />
+    <guid config_hash="0813a24fac91efc4f1dfb7dbb578f08d" mdapi_config_hash="417896f2fec55d50f844eb2344287731" id="890094c5-8615-4f69-a8b9-706c5bcbd713" chipset="cnl" name="HDCAndSF" />
+    <guid config_hash="fb9e04dafcf3519c30c215cb2094a881" mdapi_config_hash="65bd9bbb664fd329464d18e07dd9ac47" id="e56f7dd7-ff55-4bae-89a1-a526a2e3b0d6" chipset="cnl" name="L3_1" />
+    <guid config_hash="28ade5f07e44ef07814f7a307a06470c" mdapi_config_hash="24f525009f45d22253ff7c09951733c9" id="918834e2-a1a4-4d77-9f3a-0c229f8d803f" chipset="cnl" name="L3_2" />
+    <guid config_hash="7f9fb1f70df8efb8cbd236ee8920c349" mdapi_config_hash="20e9d5975e60292c3aaecfc766d2d960" id="2e95713a-c6d8-47a9-9207-eba3e208be51" chipset="cnl" name="RasterizerAndPixelBackend" />
+    <guid config_hash="c6bda99f4d7656d8b1b613c17c2d53da" mdapi_config_hash="2c48df889c497b3f97d5a350827d8f05" id="9bcf4ff2-c15f-4bea-8ec8-8db87791942e" chipset="cnl" name="Sampler" />
+    <guid config_hash="4bfffb81b9376af931bad919fc66ef3f" mdapi_config_hash="33d7ba5d98519f3038ed07f273fe5f91" id="c46c7bb5-f26d-4634-b491-902394af85b1" chipset="cnl" name="TDL_1" />
+    <guid config_hash="e5419b6c232500a6a824c2c58f3b7d32" mdapi_config_hash="b9a01044b9befe9fcf952f26ba4fcc4e" id="aa2d6ab4-99b3-42f8-94d6-4a9aa2baedaf" chipset="cnl" name="TDL_2" />
+    <guid config_hash="ccb9fdae1fe1f44c4c32bdc69befc160" mdapi_config_hash="9cf34989f5e721e734d4edf26036c2c5" id="db41edd4-d8e7-4730-ad11-b9a2d6833503" chipset="cnl" name="TestOa" />
+    <guid config_hash="eaaf4df3ac5e9b4fd52d980f0be72dbf" mdapi_config_hash="8ef6088f425f2a97b01bed560ad6e2b3" id="193093b2-da24-49bf-b407-442c213b71b4" chipset="icl" name="RenderBasic" />
+    <guid config_hash="8b7f8030265ee506c24ec10d17ab8f1a" mdapi_config_hash="f22218a44add1267d4fad705b511323c" id="12ca7e9c-55cb-45cd-9f87-4fc821488e6d" chipset="icl" name="ComputeBasic" />
+    <guid config_hash="3b6635eb3709f346076901ea88ec1f2b" mdapi_config_hash="402f156b276dfaaaf84eb09ec5347515" id="43eb7fc1-dc5e-45e2-a90a-0053f5397271" chipset="icl" name="ComputeExtended" />
+    <guid config_hash="0e47ea7e90aac987097968a231d2dada" mdapi_config_hash="08ff26b1c2405cc1061e71940cf558b5" id="05d5e01f-0800-4975-b36b-7b169cad3fab" chipset="icl" name="ComputeL3Cache" />
+    <guid config_hash="34c5bc89788487e6d32ea9894929b1ae" mdapi_config_hash="0b8dc07dcfe3a03bf65771ee8404fa10" id="03c7a167-2abc-4ba6-878a-f1d80082abca" chipset="icl" name="RenderPipeProfile" />
+    <guid config_hash="dfb00108bfdc1c652f9550bf5ec9262f" mdapi_config_hash="9b4b61a06cf60de356d48995441e6724" id="c5cbc488-6569-41dd-9128-42bf6f0d317c" chipset="icl" name="HDCAndSF" />
+    <guid config_hash="8818a97d48d99673e220075b0ba71eb3" mdapi_config_hash="d3e8cc994e923fc2f79f086273b62ece" id="0316ce4f-e03f-4738-8262-13528fce8eea" chipset="icl" name="RasterizerAndPixelBackend" />
+    <guid config_hash="e1436790af3b1bbea5a0262704c213b1" mdapi_config_hash="7b7377687e294a3c2ee88e0715a65f01" id="21d69ec3-91e1-48a8-acd6-c0c4ec6e819a" chipset="icl" name="L3_1" />
+    <guid config_hash="5ef586cc746e34ab542586805cb26c8e" mdapi_config_hash="06190180046d22f3155558f2211abc30" id="e60e9155-6830-4aec-baf2-1c3c15a73869" chipset="icl" name="L3_2" />
+    <guid config_hash="abdae7b3820fd860c6fec7a98f9654bf" mdapi_config_hash="5cf54f89d0c9ebeeebc46bfde154fdf2" id="47c364d5-1799-4d17-9447-add9358c6451" chipset="icl" name="L3_3" />
+    <guid config_hash="8b3ca983367a86a4dc4c80fe2a4cfbbb" mdapi_config_hash="397319e33a2d28c3602837be8737b559" id="e5ab5c08-3130-4469-8eaf-b23d3dc817d4" chipset="icl" name="L3_4" />
+    <guid config_hash="c5b76b0b898d48bd6305b7208f338584" mdapi_config_hash="9870c08d2dbb2de9836e8effdc5074a8" id="6cdf23c1-f725-414c-959a-c90fa5571b1f" chipset="icl" name="L3_5" />
+    <guid config_hash="667224b11f675b2ac565e18624fad738" mdapi_config_hash="e49091662060a5c502da58bd613abc7f" id="51a2eb6d-9fad-4489-8f22-ab845fe7882a" chipset="icl" name="Sampler_1" />
+    <guid config_hash="e6910b0739c288d68194e64933845380" mdapi_config_hash="d55ee03d24efe992a4029534908c2550" id="afc0f021-8c33-4d60-803d-93487f96c7c1" chipset="icl" name="Sampler_2" />
+    <guid config_hash="525a9fe5285599f695330c45ba2e8b62" mdapi_config_hash="6aa36798625267734b4d066d9090c0bd" id="eddc2f32-b196-4a72-9bf8-21770e35f8bd" chipset="icl" name="TDL_1" />
+    <guid config_hash="b141825840f912e9d7c98a13ae34d600" mdapi_config_hash="af8ee9d86606564460ce2928023e47a5" id="c6d3af7b-037b-4656-95e1-4f838f0a2c14" chipset="icl" name="TDL_2" />
+    <guid config_hash="d2188fa3c865ef430532b127a3fd87a5" mdapi_config_hash="ff33e47c767f6f81d9a779153aae6fdb" id="fd25ec19-3ed1-40c9-8648-1d2387449a92" chipset="icl" name="TDL_3" />
+    <guid config_hash="b421b29d8557dbbf0fe3068c82b3d8dd" mdapi_config_hash="cc850ab4463c23e6017f069d67785c31" id="40dc79f2-88c8-47c6-8f86-f509e39fbe5d" chipset="icl" name="GpuBusyness" />
+    <guid config_hash="7480125fc0806a347f975dc714568e92" mdapi_config_hash="c6b1c7a22e3c2f456cbfdae1bfe394ac" id="3c0bf614-5d67-4326-887f-a24eb8a58244" chipset="icl" name="TestOa" />
+    <guid config_hash="cf5cc66e29088080b9de32aca9c20fdf" mdapi_config_hash="4d959fed7563ce4c6f34e9d9c1c504a6" id="daf004fb-fc9f-45e0-b842-1770e6d273c2" chipset="tgl" name="RenderBasic" />
+    <guid config_hash="7fbc387f30cec97fff537e0609e7b622" mdapi_config_hash="4b584fd8c71948d5bec22a415f6ef3a0" id="6ad92fc0-ed62-460c-b774-5353534c67ed" chipset="tgl" name="ComputeBasic" />
+    <guid config_hash="87de7aad82eabfb9e8ca28470298c833" mdapi_config_hash="b340b1eac0b354f04e9767f14a42a6e6" id="77ae98cf-9a9e-4e35-be85-597b09ffbe53" chipset="tgl" name="RenderPipeProfile" />
+    <guid config_hash="4bd795338e2cf42726894fedccdd223f" mdapi_config_hash="d6c3023d3da8fda32655bfa1fad4e514" id="dedd95cd-1bd4-4e65-be7f-1fd7aa43fe12" chipset="tgl" name="HDCAndSF" />
+    <guid config_hash="36994d80bab156fab0dbe815184a7303" mdapi_config_hash="739afc9fff139a9b9c8a2d72297abb78" id="a889ccb3-5ebd-437f-b5c6-e951fba822f5" chipset="tgl" name="RasterizerAndPixelBackend" />
+    <guid config_hash="54690c67418eb1b8fb23d9c6b47f07d2" mdapi_config_hash="745b6634b3b72399f738761f4565e924" id="feee2629-03a8-4d31-ab4d-7d16572163fb" chipset="tgl" name="L3_1" />
+    <guid config_hash="13cfb577c221a881210d1f31600a2207" mdapi_config_hash="4b527bab2ce2a95aeeb7764f1d4abf23" id="5266f235-1711-4eef-9493-ebdf0238d512" chipset="tgl" name="L3_2" />
+    <guid config_hash="6402b8deefae23be4db362c3fd853b89" mdapi_config_hash="b21101ed0007ddb167044b476654bd8f" id="9c2cd379-bf93-4ded-b481-f64efd534c4a" chipset="tgl" name="L3_3" />
+    <guid config_hash="9f9021d53f1970e1c9f7e4ea1a8ba24d" mdapi_config_hash="71f1cc0729c56e695307c981f0f410a6" id="6a68185d-0056-4891-a5f6-29aa1e1d81ae" chipset="tgl" name="L3_4" />
+    <guid config_hash="b23742dad95e7fc75edd65fa4dc367b7" mdapi_config_hash="7198d15717542985e3ba8308fa95b3a2" id="3f17a326-ae8b-4869-9f5a-3bccf793e287" chipset="tgl" name="L3_5" />
+    <guid config_hash="6c0871403663ab1617a98afa14b01e42" mdapi_config_hash="0383f07caf50fd4f6818a2138f418409" id="d312c40a-9fb7-489a-9a1a-9cd80aac6d61" chipset="tgl" name="L3_6" />
+    <guid config_hash="b1c971413433261918b4de26d99a4388" mdapi_config_hash="b6833e7b89fc08aa05b8e5c8d200071d" id="f0f255a4-535c-43ed-9d6b-85958cef6c1c" chipset="tgl" name="Sampler_1" />
+    <guid config_hash="8f5e405d5ece3fbd0586a1ca279db170" mdapi_config_hash="44f2a86d917ab0a44332d027036d9c32" id="f47c6b97-fc10-4962-bb67-d623e9d6219b" chipset="tgl" name="Sampler_2" />
+    <guid config_hash="185968c3897d41bcf4b84a5bf23187bb" mdapi_config_hash="64c55773613e6a431df5436de5ff8e8c" id="2e49d25e-93e8-4e2b-b91b-51731f5fb315" chipset="tgl" name="TDL_1" />
+    <guid config_hash="8f99569076014439129d68470313013b" mdapi_config_hash="0ff455e43a1ef70d60afc871bd7a1293" id="2a42ff25-99b1-4048-a121-f0664ed42c90" chipset="tgl" name="TDL_2" />
+    <guid config_hash="d1c4956992d95bf782ae915e306a5343" mdapi_config_hash="3ca22a297940fee9b8d8d78106a93003" id="b763fa13-834e-4468-bba6-5f0d40db9813" chipset="tgl" name="TDL_3" />
+    <guid config_hash="e9992e7e1c679eec0ac61356a3905731" mdapi_config_hash="9328c3e2f515349dd60c6468bad254c7" id="cc935a3e-8d96-4b47-bc46-3d84247e9a3a" chipset="tgl" name="GpuBusyness" />
+    <guid config_hash="185673d9c229adff444a595e6c217439" mdapi_config_hash="51644bc87975e69064d0575227a663f9" id="30801299-fe7b-40ba-8a6c-64c6196f3748" chipset="tgl" name="TestOa" />
+    <guid config_hash="25380f09a9ab454374c78f1b5d1c4ddf" mdapi_config_hash="4d28665f4702ddf38239e5c47384dc15" id="807f52f4-e457-4da4-b2b6-9a7b6dc2b1ed" chipset="lkf" name="RenderBasic" />
+    <guid config_hash="ab51b924d738415bd6528d40401424f3" mdapi_config_hash="5e2764fea42c32327564ca99548b8846" id="3d5fa517-a3e5-4d90-9ad0-b4c3d114ba9d" chipset="lkf" name="ComputeBasic" />
+    <guid config_hash="9b6d58e5047c130f47999e04b92151e8" mdapi_config_hash="7bf6ffff6913e5536d4ad4dc4fa3b03b" id="2ab52087-3700-4db4-8dda-f73b77edfd93" chipset="lkf" name="ComputeExtended" />
+    <guid config_hash="1819d0fc7e1274aaed4dc79670eb4d33" mdapi_config_hash="6ff2fcd2498448af0ed284e69be555a8" id="498aa71d-ae5c-4523-a246-33fb2769a386" chipset="lkf" name="ComputeL3Cache" />
+    <guid config_hash="93df26813118e45063763661ffce6b77" mdapi_config_hash="d15e72e9d0ba0a4a94ed6985c86690ef" id="045dbb74-1e1a-499c-9a50-bac498e34699" chipset="lkf" name="RenderPipeProfile" />
+    <guid config_hash="91cd4922309b1259d26360831c966532" mdapi_config_hash="bc3b779c816e5763231752dff01b698c" id="63af815c-30f9-4dd5-81fa-351ad6b69b4b" chipset="lkf" name="HDCAndSF" />
+    <guid config_hash="8a7c6d0c784cc13fcb65d3baa8bb44e0" mdapi_config_hash="9aa273f8a120f0a31667c247704bbf6b" id="20df0e83-535f-457f-a08b-76aee88c1e0e" chipset="lkf" name="RasterizerAndPixelBackend" />
+    <guid config_hash="9d588e74e635377125299c5f3aa5c7d6" mdapi_config_hash="ae9e960222e31c486205e0c0f0603138" id="c7d3dc5c-975d-4d3a-a4c8-86fb0085743b" chipset="lkf" name="L3_1" />
+    <guid config_hash="3310298c4729cef20b0f20ddc8658a86" mdapi_config_hash="97d31df77e8723b93d1d215b5e596bd5" id="04003388-30ef-45d6-ae89-86f71ee596f4" chipset="lkf" name="L3_2" />
+    <guid config_hash="5d08c5947d680f307e1a3956cf87b818" mdapi_config_hash="375da2b23bb646620d82fae96f76ceb2" id="12f706a4-3761-4448-83dc-63495da010ff" chipset="lkf" name="L3_3" />
+    <guid config_hash="7ba4d260cd6343472d1e740970b0e7f3" mdapi_config_hash="78e18bf4b7860da80dbdffdef1a57d38" id="b03ae6f7-fdc0-4879-9e65-5b221ac9625f" chipset="lkf" name="L3_4" />
+    <guid config_hash="3890a445c8e58c9d7cefd7c3dcdd07a3" mdapi_config_hash="fd720998c18a22560a36fbf0ebc7346c" id="cdec4315-3c8d-416f-b3ae-33f7590e1439" chipset="lkf" name="L3_5" />
+    <guid config_hash="afa077ca791b2e4ee74ddfaf006d8fe2" mdapi_config_hash="f89f6cde18683374b31354a1a0eb6738" id="377c06c4-5f41-465a-bf2e-60d95200ba94" chipset="lkf" name="Sampler_1" />
+    <guid config_hash="e14383b58aeecf5a983d6ec57e3b2558" mdapi_config_hash="d8162037057cd1550568345e71f20e72" id="58326100-b3e7-4554-b612-592e16dc6fd1" chipset="lkf" name="Sampler_2" />
+    <guid config_hash="dd6e1a4c0aaaa84a36f83bb3772e26f6" mdapi_config_hash="7f0d9b461ff5b0fd927051c95b8f80b1" id="4c71735a-dfbf-4ebe-9df3-6c3db344a466" chipset="lkf" name="TDL_1" />
+    <guid config_hash="39c75fae3e4bc24fce0759413caac64d" mdapi_config_hash="7d8add695c157a7908abfef46b767e28" id="80e75f86-f8bc-4903-bf0f-38fd26cca636" chipset="lkf" name="TDL_2" />
+    <guid config_hash="79df0b5785c2464bedddf7c2ea34fae9" mdapi_config_hash="011bb38aa81c2e56de1e7cf9653a4047" id="9c517add-e263-4cbe-b7f8-9986f737e68a" chipset="lkf" name="TDL_3" />
+    <guid config_hash="051a88dbb1037b1e96ab8742322d5195" mdapi_config_hash="8f1f14586a4a4cbd9603488b87f3a571" id="c3103887-8c7c-482a-b923-3d68dd340598" chipset="lkf" name="GpuBusyness" />
+    <guid config_hash="2f735b47a388ee4876e999e2fe1fdaff" mdapi_config_hash="8d9471fa5f2e9d9ef3bb3be89fbc0372" id="82b6b321-f93e-445a-a285-f30391ef1dc5" chipset="lkf" name="TestOa" />
+</guids>
diff --git a/lib/i915/perf-configs/mdapi-xml-convert.py b/lib/i915/perf-configs/mdapi-xml-convert.py
new file mode 100755
index 00000000..867df286
--- /dev/null
+++ b/lib/i915/perf-configs/mdapi-xml-convert.py
@@ -0,0 +1,1006 @@
+#!/usr/bin/env python2
+
+# Copyright (C) 2015-2016 Intel Corporation
+#
+# Permission is hereby granted, free of charge, to any person obtaining a copy
+# of this software and associated documentation files (the "Software"), to deal
+# in the Software without restriction, including without limitation the rights
+# to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
+# copies of the Software, and to permit persons to whom the Software is
+# furnished to do so, subject to the following conditions:
+#
+# The above copyright notice and this permission notice shall be included in
+# all copies or substantial portions of the Software.
+#
+# THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
+# IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
+# FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
+# AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
+# LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
+# OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
+# SOFTWARE.
+
+
+# "MDAPI" xml files are an XML schema for maintaining meta data about Gen
+# graphics Observability counters, where MD API is the name of a library shared
+# by Intel GPA and Intel VTune.
+#
+# These files aren't publicly documented and have some historical baggage that
+# adds some complexity as well as being inconsistent in a number of ways that
+# makes it quite a bit of effort to parse/use the data. We also don't have
+# guarantees about how this schema is maintained.
+#
+# We've taken the opportunity to find ways to simplify the input data and to
+# make it more consistent to hopefully reduce the effort involved in using the
+# data downstream.
+#
+
+
+import argparse
+import copy
+import hashlib
+from operator import itemgetter
+import re
+import sys
+import time
+import uuid
+
+import xml.etree.ElementTree as et
+import xml.sax.saxutils as saxutils
+
+import oa_guid_registry as oa_registry
+
+
+# MDAPI configs include writes to some non-config registers,
+# thus the blacklists...
+
+gen8_11_chipset_params = {  # one parameter table shared by every non-HSW entry in `chipsets`
+    'a_offset': 16,  # first raw-report offset decoded as an A counter (4-byte slots)
+    'b_offset': 192,  # first raw-report offset decoded as a B counter
+    'c_offset': 224,  # first raw-report offset decoded as a C counter
+    'oa_report_size': 256,  # raw offsets at or past this are resolved as register reads instead
+    'config_reg_blacklist': {
+        0x2364, # OACTXID
+    },
+}
+
+chipsets = {  # per-chipset parameters, keyed by upper-case chipset name
+    'HSW': {  # Haswell is the only chipset here with its own parameter table
+        'a_offset': 12,
+        'b_offset': 192,
+        'c_offset': 224,
+        'oa_report_size': 256,
+        'registers': {  # register offset -> symbolic name; the TRIG registers run 1..8 in 4-byte steps
+            # TODO extend the symbol table for nicer output...
+            0x2710: { 'name': 'OASTARTTRIG1' },
+            0x2714: { 'name': 'OASTARTTRIG2' },
+            0x2718: { 'name': 'OASTARTTRIG3' },
+            0x271c: { 'name': 'OASTARTTRIG4' },
+            0x2720: { 'name': 'OASTARTTRIG5' },
+            0x2724: { 'name': 'OASTARTTRIG6' },
+            0x2728: { 'name': 'OASTARTTRIG7' },
+            0x272c: { 'name': 'OASTARTTRIG8' },
+            0x2740: { 'name': 'OAREPORTTRIG1' },
+            0x2744: { 'name': 'OAREPORTTRIG2' },
+            0x2748: { 'name': 'OAREPORTTRIG3' },
+            0x274c: { 'name': 'OAREPORTTRIG4' },
+            0x2750: { 'name': 'OAREPORTTRIG5' },
+            0x2754: { 'name': 'OAREPORTTRIG6' },
+            0x2758: { 'name': 'OAREPORTTRIG7' },
+            0x275c: { 'name': 'OAREPORTTRIG8' },
+            0x2770: { 'name': 'OACEC0_0' },
+            0x2774: { 'name': 'OACEC0_1' },
+            0x2778: { 'name': 'OACEC1_0' },
+            0x277c: { 'name': 'OACEC1_1' },
+            0x2780: { 'name': 'OACEC2_0' },
+            0x2784: { 'name': 'OACEC2_1' },
+            0x2788: { 'name': 'OACEC3_0' },
+            0x278c: { 'name': 'OACEC3_1' },
+            0x2790: { 'name': 'OACEC4_0' },
+            0x2794: { 'name': 'OACEC4_1' },
+            0x2798: { 'name': 'OACEC5_0' },
+            0x279c: { 'name': 'OACEC5_1' },
+            0x27a0: { 'name': 'OACEC6_0' },
+            0x27a4: { 'name': 'OACEC6_1' },
+            0x27a8: { 'name': 'OACEC7_0' },
+            0x27ac: { 'name': 'OACEC7_1' },
+        },
+        'config_reg_blacklist': {
+            0x2364, # OASTATUS1 register
+        },
+    },
+    'BDW': gen8_11_chipset_params,  # this and every entry below reference the same dict object
+    'CHV': gen8_11_chipset_params,
+    'SKLGT2': gen8_11_chipset_params,
+    'SKLGT3': gen8_11_chipset_params,
+    'SKLGT4': gen8_11_chipset_params,
+    'BXT': gen8_11_chipset_params,
+    'KBLGT2': gen8_11_chipset_params,
+    'KBLGT3': gen8_11_chipset_params,
+    'GLK': gen8_11_chipset_params,
+    'CFLGT2': gen8_11_chipset_params,
+    'CFLGT3': gen8_11_chipset_params,
+    'CNL': gen8_11_chipset_params,
+    'ICL': gen8_11_chipset_params,
+    'LKF': gen8_11_chipset_params,
+    'TGL': gen8_11_chipset_params,
+}
+
+register_types = { 'OA', 'NOA', 'FLEX', 'PM' }  # NOTE(review): presumably the accepted register "type" values - confirm at the use site
+
+default_set_blacklist = { "RenderDX1x", # TODO: rename to something non 'DX'
+                                        # specific if this config is generally
+                                        # useful
+                          "RenderBalance", # XXX: missing register config
+                          "PipelineTimestamps", # Covered by API timestamp queries
+                        }
+
+counter_blacklist = {
+    "DramLlcThroughput", # TODO: The max equation of this counter
+                         # requires the DRAM throughput value. Need to
+                         # investigate how to get this value.
+}
+
+sys_vars = { "EuCoresTotalCount",  # NOTE(review): presumably the system-variable symbols recognised in equations - confirm at the use site
+             "EuSlicesTotalCount",
+             "SamplersTotalCount",
+             "EuThreadsCount",
+             "GpuMinFrequencyMHz",
+             "GpuMaxFrequencyMHz",
+             "GpuTimestampFrequency",
+             "SliceMask",
+             "SubsliceMask",
+             "EuSubslicesTotalCount"
+           }
+
+def underscore(name):
+    """Return `name` (CamelCase, possibly dotted) as lower snake_case; 'MHz' is kept as one word."""
+    s = re.sub(r'\.', '_', name.replace('MHz', 'Mhz'))  # raw string: '\.' is an invalid str escape
+    s = re.sub('(.)([A-Z][a-z]+)', r'\1_\2', s)
+    return re.sub('([a-z0-9])([A-Z])', r'\1_\2', s).lower()
+
+def print_err(*args):  # write the str() of each argument, space-joined, plus a newline to stderr
+    sys.stderr.write("%s\n" % ' '.join(str(arg) for arg in args))
+
+read_register_offsets = {  # register offsets that read tokens may name outside the counter ranges
+    0x1f0: 'PERFCNT1',
+    0x1f8: 'PERFCNT2',
+}
+
+def read_value(chipset, offset):  # symbolic name for a known register offset; logs and asserts otherwise
+    if offset not in read_register_offsets:
+        print_err("Unknown offset register at offset {0}".format(offset))
+    assert offset in read_register_offsets
+    return read_register_offsets.get(offset)
+
+
+def read_token_to_rpn_read(chipset, token, raw_offsets):
+    """Convert one MDAPI '<width>@<hex offset>' read token to an RPN read op.
+
+    chipset     -- chipset name; key into the module level `chipsets` table
+                   when raw_offsets is true, and selects the HSW layout
+    token       -- read token such as 'dw@0x10' or 'rd40@0x18:0xa0'
+    raw_offsets -- True if the offset indexes a raw OA report, False if it
+                   indexes the array of accumulated (delta report) values
+
+    Returns a string such as "GPU_TIME 0 READ", "A 5 READ" or
+    "PERFCNT1 READ_REG".
+    """
+    width, offset_str = token.split('@')
+
+    # For Broadwell the raw read notation was extended for 40 bit
+    # counters: rd40@<32bit_part1_offset>:<8bit_part2_offset>
+    # Only the offset of the 32bit part is used to identify the counter.
+    if width == "rd40":
+        offset_str, _ = offset_str.split(':')
+
+    offset = int(offset_str, 16)
+
+    # Counter indices below use '//' so that they stay integers (and are
+    # formatted as "5", not "5.0") on Python 3 as well as Python 2.
+    if raw_offsets:
+        a_offset = chipsets[chipset]['a_offset']
+        b_offset = chipsets[chipset]['b_offset']
+        c_offset = chipsets[chipset]['c_offset']
+        report_size = chipsets[chipset]['oa_report_size']
+
+        if offset < a_offset:
+            if offset == 4:
+                return "GPU_TIME 0 READ"
+            elif offset == 12:
+                assert chipset != "HSW" # Only for Gen8+
+                return "GPU_CLOCK 0 READ"
+            else:
+                raise AssertionError("unexpected report header offset")
+        elif offset < b_offset:
+            return "A " + str((offset - a_offset) // 4) + " READ"
+        elif offset < c_offset:
+            return "B " + str((offset - b_offset) // 4) + " READ"
+        elif offset < report_size:
+            return "C " + str((offset - c_offset) // 4) + " READ"
+        else:
+            return "{0} READ_REG".format(read_value(chipset, offset))
+    else:
+        idx = offset // 8
+        if chipset == "HSW":
+            # On Haswell accumulated counters are assumed to start
+            # with GPU_TIME followed by 45 A counters, then 8 B
+            # counters and finally 8 C counters.
+            if idx < 1:
+                return "GPU_TIME 0 READ"
+            elif idx < 46:
+                return "A " + str(idx - 1) + " READ"
+            elif idx < 54:
+                return "B " + str(idx - 46) + " READ"
+            elif idx < 62:
+                return "C " + str(idx - 54) + " READ"
+            else:
+                return "{0} READ_REG".format(read_value(chipset, offset))
+        else:
+            # For Gen8+ the array of accumulated counters is
+            # assumed to start with a GPU_TIME then GPU_CLOCK,
+            # then 36 A counters, then 8 B counters and finally
+            # 8 C counters.
+            if idx == 0:
+                return "GPU_TIME 0 READ"
+            elif idx == 1:
+                return "GPU_CLOCK 0 READ"
+            elif idx < 38:
+                return "A " + str(idx - 2) + " READ"
+            elif idx < 46:
+                return "B " + str(idx - 38) + " READ"
+            elif idx < 54:
+                return "C " + str(idx - 46) + " READ"
+            else:
+                return "{0} READ_REG".format(read_value(chipset, offset))
+
+def replace_read_tokens_with_rpn_read_ops(chipset, equation, raw_offsets):
+    """Rewrite every '<width>@<offset>' token of an equation as an RPN read op.
+
+    The equation is split on whitespace; tokens containing '@' are passed to
+    read_token_to_rpn_read() and all other tokens are kept as they are. Each
+    resulting token is emitted with a single leading space, so a non-empty
+    result always starts with a space.
+    """
+    # MDAPI MetricSet equations use tokens like 'dw@0xff' for reading raw
+    # values from snapshots, which is inconvenient for two reasons:
+    #
+    # 1) The offsets hide which a, b, or c counter they correspond to,
+    #    which makes it awkward to experiment with different report
+    #    sizes that trade off how many a, b and c counters are available
+    #
+    # 2) Raw reads can be represented as RPN operations too, and that
+    #    consistency makes them slightly easier for tools to handle, E.g:
+    #
+    #      "A 5 READ" = read A counter 5
+    #
+    # So the address tokens are replaced with GPU_TIME, A, B or C READ ops.
+    pieces = []
+    for word in equation.split():
+        if '@' in word:
+            word = read_token_to_rpn_read(chipset, word, raw_offsets)
+        pieces.append(" " + word)
+
+    return "".join(pieces)
+
+
+# Command line interface: one or more MDAPI XML files plus the GUID registry.
+parser = argparse.ArgumentParser()
+parser.add_argument("xml", nargs="+", help="XML description of metrics")
+parser.add_argument("--guids", required=True, help="Metric set GUID registry")
+parser.add_argument("--whitelist", help="Only output for given, space-separated, sets")
+parser.add_argument("--blacklist", help="Don't generate anything for given metric sets")
+parser.add_argument("--merge", help="Additional meta data to merge into the result")
+parser.add_argument("--dry-run", action="store_true",
+                    help="Not generate new XML but to check any errors")
+
+args = parser.parse_args()
+
+# Root of the generated document; converted <set> elements are added to it.
+metrics = et.Element('metrics')
+tree = et.ElementTree(metrics)
+
+def apply_aliases(text, aliases):
+    """Apply 'old|new' whole-word substitutions to text.
+
+    aliases is a comma separated list of 'old|new' pairs, or None for no
+    substitution. Each pair is applied as written and then again with both
+    sides lower-cased.
+    """
+    if aliases is None:
+        return text
+
+    for pair in aliases.split(','):
+        old, new = pair.split('|')
+        for src, dst in ((old, new), (old.lower(), new.lower())):
+            text = re.sub(r"\b%s\b" % re.escape(src), dst, text)
+
+    return text
+
+def strip_dx_apis(text):
+    """Return the space separated API list with every 'DX...' entry removed.
+
+    None yields an empty string.
+    """
+    if text is None:
+        return ""
+    kept = [api for api in text.split() if not api.startswith("DX")]
+    return " ".join(kept)
+
+# For recursively appending counters in order of dependencies...
+def append_deps_and_counter(mdapi_counter, mdapi_counters, deps,
+                            sorted_array, sorted_set):
+    """Append mdapi_counter to sorted_array after all of its dependencies.
+
+    mdapi_counters -- dict of SymbolName -> counter for the whole metric set
+    deps           -- dict of SymbolName -> list of names it depends on
+    sorted_array   -- output list, extended in dependency order
+    sorted_set     -- dict of SymbolName -> counter for every counter that
+                      has been visited (appended, or currently being appended)
+
+    Dependencies that are not in mdapi_counters are ignored.
+    """
+    symbol_name = mdapi_counter.get('SymbolName')
+
+    if symbol_name in sorted_set:
+        return
+
+    # Mark the counter as visited *before* descending so that a circular
+    # reference between counters terminates instead of recursing forever.
+    # For acyclic dependencies the resulting order is unchanged.
+    sorted_set[symbol_name] = mdapi_counter
+
+    for dep_name in deps[symbol_name]:
+        if dep_name in mdapi_counters:
+            append_deps_and_counter(mdapi_counters[dep_name], mdapi_counters, deps,
+                                    sorted_array, sorted_set)
+
+    sorted_array.append(mdapi_counter)
+
+def sort_counters(mdapi_counters, deps):
+    """Return the counters as a list in which dependencies come first."""
+    sorted_array = []
+    sorted_set = {} # counters in here have been visited already
+    for symbol_name in mdapi_counters:
+        append_deps_and_counter(mdapi_counters[symbol_name], mdapi_counters, deps,
+                                sorted_array, sorted_set)
+
+    return sorted_array
+
+def expand_macros(equation):
+    """Expand the 'GpuDuration' and 'EuAggrDuration' equation macros."""
+    macros = (
+        ('GpuDuration', "$Self 100 UMUL $GpuCoreClocks FDIV"),
+        ('EuAggrDuration', "$Self $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"),
+    )
+    for macro, expansion in macros:
+        equation = equation.replace(macro, expansion)
+    return equation
+
+def fixup_equation(equation):
+    """Correct the misspelt '$SubliceMask' variable; None is passed through."""
+    if equation is not None:
+        return equation.replace('$SubliceMask', '$SubsliceMask')
+    return None
+
+# The MDAPI XML files sometimes duplicate the same Flex EU/OA regs
+# between configs with different AvailabilityEquations even though the
+# availability checks are only expected to affect the MUX configs
+#
+# We iterate all the configs to filter out the FLEX/OA configs and
+# double check that there's never any variations between repeated
+# configs
+#
+def filter_single_config_registers_of_type(mdapi_metric_set, type):
+    """Return the (offset, value) registers of the given type for a set.
+
+    mdapi_metric_set -- MDAPI <MetricSet> element
+    type             -- register type to extract, e.g. "FLEX" or "OA"
+
+    Registers whose offset is in the current chipset's
+    'config_reg_blacklist' are dropped (the module level `chipset` variable
+    selects the entry of `chipsets`). If several <RegConfigStart> elements
+    contain registers of this type they must all be identical, otherwise an
+    error is reported and the script exits with status 1.
+    """
+    regs = []
+    for mdapi_reg_config in mdapi_metric_set.findall("RegConfigStart"):
+        tmp_regs = []
+        for mdapi_reg in mdapi_reg_config.findall("Register"):
+            reg = (int(mdapi_reg.get('offset'),16), int(mdapi_reg.get('value'),16))
+
+            if reg[0] in chipsets[chipset]['config_reg_blacklist']:
+                continue
+
+            if mdapi_reg.get('type') == type:
+                tmp_regs.append(reg)
+
+        if len(tmp_regs) == 0:
+            continue
+
+        if len(regs) == 0:
+            regs = tmp_regs
+        elif regs != tmp_regs:
+            # List inequality covers both a differing length and a differing
+            # element, and avoids the Python 2 only xrange() builtin.
+            print_err("ERROR: multiple, differing FLEX/OA configs for one set: MetricSet=\"" + mdapi_metric_set.get('ShortName'))
+            sys.exit(1)
+
+    return regs
+
+
+# The MDAPI XML files only use a handful of config IDs, and nothing
+# guarantees that they start from zero or are contiguous, so the groups
+# are kept in a plain list that is searched linearly.
+def get_mux_id_group(id_groups, id):
+    """Return the group dict with the given id, creating it if necessary.
+
+    A newly created group has an empty 'configs' list and is appended to
+    id_groups.
+    """
+    found = next((group for group in id_groups if group['id'] == id), None)
+    if found is not None:
+        return found
+
+    created = { 'id': id, 'configs': [] }
+    id_groups.append(created)
+    return created
+
+
+
+def process_mux_configs(mdapi_set):
+    """Collect the NOA/PM (MUX) register configs of an MDAPI metric set.
+
+    Returns a non-empty list of dicts with the keys 'priority',
+    'availability' (None when the AvailabilityEquation is empty or absent)
+    and 'registers' (list of (address, value) tuples). Registers whose
+    address is in the current chipset's 'config_reg_blacklist' are dropped.
+
+    Reports an error and exits with status 1 on unknown register types, on
+    a mixture of implied and explicit ConfigIds, on unsupported ConfigId
+    groupings and when no MUX config is found.
+    """
+    allow_missing_id = True
+
+    mux_config_id_groups = []
+
+    for mdapi_reg_config in mdapi_set.findall("RegConfigStart"):
+
+        mux_regs = []
+        for mdapi_reg in mdapi_reg_config.findall("Register"):
+            address = int(mdapi_reg.get('offset'), 16)
+
+            if address in chipsets[chipset]['config_reg_blacklist']:
+                continue
+
+            reg_type = mdapi_reg.get('type')
+
+            if reg_type not in register_types:
+                # str(): a missing 'type' attribute yields None, which cannot
+                # be concatenated into the message directly
+                print_err("ERROR: unknown register type=\"" + str(reg_type) + "\": MetricSet=\"" + mdapi_set.get('ShortName'))
+                sys.exit(1)
+
+            if reg_type != 'NOA' and reg_type != 'PM':
+                continue
+
+            reg = (address, int(mdapi_reg.get('value'), 16))
+            mux_regs.append(reg)
+
+        if len(mux_regs) == 0:
+            continue
+
+        availability = mdapi_reg_config.get('AvailabilityEquation')
+        if availability == "":
+            availability = None
+
+        config_priority = mdapi_reg_config.get('ConfigPriority')
+        if config_priority is not None:
+            reg_config_priority = int(config_priority)
+        else:
+            reg_config_priority = 0
+
+        config_id = mdapi_reg_config.get('ConfigId')
+        if config_id is not None:
+            reg_config_id = int(config_id)
+            allow_missing_id = False
+        elif allow_missing_id:
+            reg_config_id = 0
+        else:
+            # It will spell trouble if there's a mixture of explicit and
+            # implied config IDs...
+            print_err("ERROR: register configs mixing implied/explicit IDs: MetricSet=\"" + mdapi_set.get('ShortName'))
+            sys.exit(1)
+
+        mux_config = { 'priority': reg_config_priority,
+                       'availability': availability,
+                       'registers': mux_regs }
+
+        mux_config_id_group = get_mux_id_group(mux_config_id_groups, reg_config_id)
+        mux_config_id_group['configs'].append(mux_config)
+
+    mux_config_id_groups.sort(key=itemgetter('id'))
+
+    # The only special case we currently support for more than one group of NOA
+    # MUX configs is for the Broadwell ComputeExtended metric set with two Id
+    # groups and the second just has a single unconditional config that can
+    # logically be appended to all the conditional configs of the first group
+    if len(mux_config_id_groups) > 1:
+        if len(mux_config_id_groups) != 2:
+            print_err("ERROR: Script doesn't currently allow more than two groups of NOA MUX configs for a single metric set: MetricSet=\"" + mdapi_set.get('ShortName'))
+            sys.exit(1)
+
+        last_id_group = mux_config_id_groups[-1]
+        if len(last_id_group['configs']) != 1:
+            print_err("ERROR: Script currently only allows up to two Ids for NOA MUX configs if second Id only contains a single unconditional config: MetricSet=\"" + mdapi_set.get('ShortName'))
+            sys.exit(1)
+
+        tail_config = last_id_group['configs'][0]
+        for mux_config in mux_config_id_groups[0]['configs']:
+            mux_config['registers'] = mux_config['registers'] + tail_config['registers']
+
+        mux_config_id_groups = [mux_config_id_groups[0]]
+
+    # Compare the *length* of the config list with zero; comparing the list
+    # itself with 0 is always false.
+    if len(mux_config_id_groups) == 0 or len(mux_config_id_groups[0]['configs']) == 0:
+        print_err("ERROR: MUX register configs missing: MetricSet=\"" + mdapi_set.get('ShortName'))
+        sys.exit(1)
+
+    mux_configs = mux_config_id_groups[0]['configs']
+    assert isinstance(mux_configs, list)
+    assert len(mux_configs) >= 1
+    assert len(mux_configs[0]['registers']) > 1 # > 1 registers
+    return mux_configs
+
+
+def add_register_config(set, priority, availability, regs, type):
+    """Append a <register_config> element of the given type to a <set>.
+
+    'priority' and 'availability' attributes are only written when an
+    availability expression is given, which is only allowed for "NOA"
+    configs. Every (address, value) entry of regs becomes a <register>
+    child with both numbers formatted as 0x%08X.
+    """
+    reg_config = et.SubElement(set, 'register_config')
+    reg_config.set('type', type)
+
+    if availability is not None:
+        assert type == "NOA"
+        reg_config.set('priority', str(priority))
+        reg_config.set('availability', availability)
+
+    for reg in regs:
+        address, value = reg[0], reg[1]
+        elem = et.SubElement(reg_config, 'register')
+        elem.set('type', type)
+        elem.set('address', "0x%08X" % address)
+        elem.set('value', "0x%08X" % value)
+
+def to_text(value):
+    """Map None to an empty string; return any other value unchanged."""
+    return "" if value is None else value
+
+# There are duplicated metric sets with the same symbol name so we
+# keep track of the sets we've read so we can skip duplicates...
+sets = {}
+
+# Maps the hash derived from (chipset, mdapi_config_hash) of every <guid>
+# entry in the --guids registry file to that entry's 'id' attribute.
+guids = {}
+
+guids_xml = et.parse(args.guids)
+for guid in guids_xml.findall(".//guid"):
+    hashing_key = oa_registry.Registry.chipset_derive_hash(guid.get('chipset'),
+                                                           guid.get('mdapi_config_hash'))
+    guids[hashing_key] = guid.get('id')
+
+# Main conversion pass: every <MetricSet> of every MDAPI XML file given on the
+# command line is converted into a <set> element (register configs followed by
+# counters) under the `metrics` root.
+for arg in args.xml:
+    mdapi = et.parse(arg)
+
+    concurrent_group = mdapi.find(".//ConcurrentGroup")
+
+    for mdapi_set in mdapi.findall(".//MetricSet"):
+
+        # Only sets advertising OGL, OCL or MEDIA support are converted
+        apis = mdapi_set.get('SupportedAPI')
+        if "OGL" not in apis and "OCL" not in apis and "MEDIA" not in apis:
+            continue
+
+        set_symbol_name = mdapi_set.get('SymbolName')
+
+        if set_symbol_name in sets:
+            print_err("WARNING: duplicate set named \"" + set_symbol_name + "\" (SKIPPING)")
+            continue
+
+        # Note: `chipset` is also read as a global by the register helpers
+        chipset = mdapi_set.get('SupportedHW')
+        if concurrent_group.get('SupportedGT') != None:
+            chipset = chipset + concurrent_group.get('SupportedGT')
+        if chipset not in chipsets:
+            print_err("WARNING: unsupported chipset {0}, consider updating {1}".format(chipset, __file__))
+            continue
+
+        if args.whitelist:
+            set_whitelist = args.whitelist.split()
+            if set_symbol_name not in set_whitelist:
+                continue
+
+        if args.blacklist:
+            set_blacklist = args.blacklist.split()
+        else:
+            set_blacklist = default_set_blacklist
+        if set_symbol_name in set_blacklist:
+            continue
+
+        if mdapi_set.get('SnapshotReportSize') != '256':
+            print_err("WARNING: skipping metric set '{0}', report size {1} invalid".format(set_symbol_name, mdapi_set.get('SnapshotReportSize')))
+            continue
+
+        set = et.SubElement(metrics, 'set')
+
+        set.set('chipset', chipset)
+
+        set.set('name', mdapi_set.get('ShortName'))
+        set.set('symbol_name', set_symbol_name)
+        set.set('underscore_name', underscore(mdapi_set.get('SymbolName')))
+        set.set('mdapi_supported_apis', strip_dx_apis(mdapi_set.get('SupportedAPI')))
+
+
+        # Look at the hardware register config before looking at the counters.
+        #
+        # The hardware configuration is used as a key to look up a GUID which
+        # is used by applications to lookup the corresponding counter
+        # normalization equations.
+        #
+        # We want to skip over any metric sets that don't yet have a registered
+        # GUID in guids.xml.
+
+        # There can be multiple NOA MUX configs, since they may have associated
+        # availability tests to match particular systems.
+        #
+        # Unlike the MDAPI XML files we only support tracking one group of
+        # mutually exclusive MUX configs, whereas the MDAPI XML files
+        # theoretically allow a single metric set to be associated with ordered
+        # groups of mutually exclusive configs. So far there is only one
+        # Broadwell, ComputeExtended metric set which uses this, but that
+        # particular case can be expressed in less general terms.
+        #
+        # Being a bit simpler here should make it easier for downstream tools
+        # to deal with. (At least we got the handling of the Broadwell
+        # ComputeExtended example wrong and it took several email exchanges and
+        # a conference call to confirm how to interpret this case)
+        mux_configs = process_mux_configs(mdapi_set)
+
+        # Unlike for MUX registers, we only expect one set of FLEX/OA
+        # registers per metric set (even though they are sometimes duplicated
+        # between configs in MDAPI XML files).
+        #
+        # This filter function, extracts the register of a certain type but
+        # also double checks that if they are repeated in separate configs that
+        # they don't vary. (Notably the current i915 perf Linux driver would
+        # need some adapting to support multiple OA/FLEX configs with different
+        # availability expressions)
+        #
+        flex_regs = filter_single_config_registers_of_type(mdapi_set, "FLEX")
+        oa_regs = filter_single_config_registers_of_type(mdapi_set, "OA")
+
+
+        # Note: we ignore Perfmon registers
+
+        for mux_config in mux_configs:
+            add_register_config(set, mux_config['priority'], mux_config['availability'], mux_config['registers'], "NOA")
+        if len(oa_regs) > 0:
+            add_register_config(set, 0, None, oa_regs, "OA")
+        if len(flex_regs) > 0:
+            add_register_config(set, 0, None, flex_regs, "FLEX")
+
+        mdapi_hw_config_hash = oa_registry.Registry.mdapi_hw_config_hash(mdapi_set)
+        guid_hash = oa_registry.Registry.chipset_derive_hash(chipset.lower(),
+                                                             mdapi_hw_config_hash)
+        hw_config_hash = oa_registry.Registry.hw_config_hash(set)
+
+        if guid_hash in guids:
+            set.set('hw_config_guid', guids[guid_hash])
+        else:
+            print_err("WARNING: No GUID found for metric set " + chipset + ", " + set_symbol_name + " (SKIPPING)")
+            print_err("WARNING: If this is a new config add the following to guids.xml:")
+            print_err("<guid config_hash=\"" + hw_config_hash + "\" mdapi_config_hash=\"" + mdapi_hw_config_hash + "\" id=\"" + str(uuid.uuid4()) + "\" chipset=\"" + chipset.lower() + "\" name=\"" + set_symbol_name + "\" />")
+            metrics.remove(set)
+            continue
+
+
+        sets[set_symbol_name] = set
+
+        # Per-set bookkeeping, keyed by counter symbol name, for the counters
+        # that have been emitted so far
+        counters = {}
+        normalization_equations = {}
+        raw_equations = {}
+
+        # Awkwardly we can't assume metrics are in dependency order and have to
+        # sort them manually. We start by associating a list of dependencies with
+        # each counter...
+
+        mdapi_counters = {}
+        mdapi_counter_deps = {}
+
+        for mdapi_counter in mdapi_set.findall("Metrics/Metric"):
+            symbol_name = mdapi_counter.get('SymbolName')
+
+            if symbol_name in counter_blacklist:
+                continue
+
+            # Have seen at least one MetricSet with a duplicate GpuCoreClocks counter...
+            if symbol_name in mdapi_counters:
+                print_err("WARNING: Skipping duplicate counter \"" + symbol_name + \
+                        "\" in " + set.get('name') + " :: " + mdapi_counter.get('ShortName'))
+                continue
+
+            # Every '$Name' token of any of the counter's equations that is
+            # neither a system variable nor '$Self' is a dependency
+            deps = []
+            equations = fixup_equation(str(mdapi_counter.get('SnapshotReportReadEquation'))) + " " + \
+                        fixup_equation(str(mdapi_counter.get('SnapshotReportDeltaEquation'))) + " " + \
+                        fixup_equation(str(mdapi_counter.get('DeltaReportReadEquation'))) + " " + \
+                        fixup_equation(str(mdapi_counter.get('NormalizationEquation')))
+            equations = expand_macros(equations)
+            equations = equations.replace('$$', "$")
+            for token in equations.split():
+                if token[0] == '$' and token[1:] not in sys_vars and token[1:] != "Self":
+                    deps.append(token[1:])
+
+            mdapi_counters[symbol_name] = mdapi_counter
+            mdapi_counter_deps[symbol_name] = deps
+
+        sorted_mdapi_counters = sort_counters(mdapi_counters, mdapi_counter_deps)
+
+        for mdapi_counter in sorted_mdapi_counters:
+
+            aliases = mdapi_counter.get('Alias')
+
+            skip_counter = False
+
+            # We don't currently support configuring and reading perfmon registers
+            signal = mdapi_counter.get('SignalName')
+            if signal and "perfmon" in signal:
+                continue
+
+            # A few things to fixup with this common counter...
+            if mdapi_counter.get('SymbolName') == "AvgGpuCoreFrequencyMHz":
+                # To avoid requiring a special case in tools, add a max value
+                # equation for the gpu frequency...
+                mdapi_counter.set('MaxValueEquation', "$GpuMaxFrequency")
+
+                # Don't include units in the name
+                mdapi_counter.set('SymbolName', "AvgGpuCoreFrequency")
+
+                # Use canonical, first order of magnitude units specifier
+                mdapi_counter.set('MetricUnits', 'Hz')
+                mdapi_counter.set('NormalizationEquation', '$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV')
+
+
+            symbol_name = mdapi_counter.get('SymbolName')
+
+            counter = et.SubElement(set, 'counter')
+            counter.set('name', apply_aliases(mdapi_counter.get('ShortName'), aliases))
+            counter.set('symbol_name', mdapi_counter.get('SymbolName'))
+            counter.set('underscore_name', underscore(mdapi_counter.get('SymbolName')))
+            counter.set('description', apply_aliases(mdapi_counter.get('LongName'), aliases))
+            counter.set('mdapi_group', apply_aliases(to_text(mdapi_counter.get('Group')), aliases))
+            counter.set('mdapi_usage_flags', to_text(mdapi_counter.get('UsageFlags')))
+            counter.set('mdapi_supported_apis', strip_dx_apis(mdapi_counter.get('SupportedAPI')))
+            low = mdapi_counter.get('LowWatermark')
+            if low:
+                counter.set('low_watermark', low)
+            high = to_text(mdapi_counter.get('HighWatermark'))
+            if high:
+                counter.set('high_watermark', high)
+            counter.set('data_type', mdapi_counter.get('ResultType').lower())
+
+            max_eq = fixup_equation(mdapi_counter.get('MaxValueEquation'))
+            if max_eq:
+                counter.set('max_equation', max_eq)
+
+            # XXX Not sure why EU metrics tend to just be bundled under 'gpu'
+            counter.set('mdapi_hw_unit_type', mdapi_counter.get('HWUnitType').lower())
+
+            # There are counters representing cycle counts that have a semantic
+            # type of 'duration' which doesn't seem to make sense...
+            units = mdapi_counter.get('MetricUnits').lower()
+            if units == "cycles":
+                semantic_type = "event"
+            else:
+                semantic_type = mdapi_counter.get('MetricType').lower()
+
+            counter.set('units', units)
+            counter.set('semantic_type', semantic_type)
+
+            # MDAPI MetricSets have 3 different kinds of counter read equations:
+            #
+            # 1) One for reading a raw (unnormalized) value from a hardware report
+            #
+            #       The line between normalized and raw isn't always clear
+            #       as the raw equation may e.g. read and ADD multiple counters
+            #
+            #       Not all counters have a raw equation if they are instead
+            #       derived through $CounterName references to other counters
+            #       in a normalized value equation
+            #
+            # 2) One for reading an unnormalized value from the accumulated 'delta reports'
+            #
+            #       Seems to duplicate the raw equation but with delta report
+            #       offsets and referencing 64bit values
+            #
+            #       The normalized value equations are always based on these
+            #       accumulated delta values
+            #
+            # 3) One for reading a normalized value
+            #
+            #       These may start with a reference to "$Self" which is
+            #       effectively a macro for the above delta report equation
+            #
+            #       If this is missing the delta report equation is effectively
+            #       the normalized equation too
+            #
+            #       XXX: Beware that there are some inconsistent counters that
+            #       have a normalization equation with a $Self reference and a
+            #       raw equation but no delta report equation. This seems
+            #       pretty sketchy, but (at least for 'MEDIA' metrics) we will
+            #       substitute the raw equation for $Self in this case along
+            #       with a warning to double check the results.
+            #
+            # Currently there doesn't appear to be a clear reason to
+            # differentiate these equations and the separation seems to
+            # complicate things for tools wanting to generate code from this
+            # data.
+            #
+            # We instead aim to have one normalized equation per counter that
+            # always reference accumulated counter values.
+
+            # XXX: As a special case, we override the raw and delta report
+            # equations for the GpuTime counters, which seem inconsistent
+            #
+            # The reads must be single '<width>@<offset>' tokens: only tokens
+            # containing '@' are translated into READ ops further down, which
+            # is what makes the raw and delta equations compare equal.
+            if mdapi_counter.get('SymbolName') == "GpuTime":
+                mdapi_counter.set('SnapshotReportReadEquation', "dw@0x04 1000000000 UMUL $GpuTimestampFrequency UDIV")
+                mdapi_counter.set('DeltaReportReadEquation', "qw@0x0 1000000000 UMUL $GpuTimestampFrequency UDIV")
+
+            availability = fixup_equation(mdapi_counter.get('AvailabilityEquation'))
+            if availability == "":
+                availability = None
+
+            # We prefer to only look at the equations that reference the raw
+            # reports since the mapping of offsets back to A,B,C counters is
+            # unambiguous, but if necessary we will fallback to mapping
+            # delta report offsets (accumulated 64bit values that correspond
+            # to the 32bit or 40bit values from raw reports)
+            #
+            # Missing (None) and empty equations are left untouched here.
+
+            raw_read_eq = fixup_equation(mdapi_counter.get('SnapshotReportReadEquation'))
+            if raw_read_eq:
+                raw_read_eq = replace_read_tokens_with_rpn_read_ops(chipset,
+                                                                    raw_read_eq,
+                                                                    True) #raw offsets
+
+            delta_read_eq = fixup_equation(mdapi_counter.get('DeltaReportReadEquation'))
+            if delta_read_eq:
+                delta_read_eq = replace_read_tokens_with_rpn_read_ops(chipset,
+                                                                      delta_read_eq,
+                                                                      False) #delta offsets
+
+            if raw_read_eq and not delta_read_eq:
+                print_err("WARNING: Counter with raw equation but no delta report equation: MetricSet=\"" + \
+                          mdapi_set.get('ShortName') + "\" Metric=\"" + mdapi_counter.get('SymbolName') + \
+                          "(" + mdapi_counter.get('ShortName') + ")" + "\"")
+                # Media metric counters currently have no delta equation even
+                # though they have normalization equations that reference $Self
+                if "MEDIA" in apis:
+                    print_err("WARNING: -> Treating inconsistent media metric's 'raw' equation as a 'delta report' equation, but results should be double checked!")
+                    delta_read_eq = raw_read_eq
+                else:
+                    set.remove(counter)
+                    continue
+
+            # Some counters are sourced from register values that are
+            # not put into the OA reports. This is why some counters
+            # will have a delta equation but not a raw equation. These
+            # counters are typically only available in query mode. For
+            # this reason we put a particular availability value.
+            if delta_read_eq and not raw_read_eq:
+                assert availability == None
+                availability = "true $QueryMode &&"
+                raw_read_eq = delta_read_eq
+
+            # After replacing read tokens with RPN counter READ ops the raw and
+            # delta equations are expected to be identical so warn if that's
+            # not true...
+            if bool(raw_read_eq) ^ bool(delta_read_eq) or raw_read_eq != delta_read_eq:
+                print_err("WARNING: Inconsistent raw and delta report equations for " + \
+                          mdapi_set.get('ShortName') + " :: " + mdapi_counter.get('SymbolName') + \
+                          "(" + mdapi_counter.get('ShortName') + ")" + ": raw=\"" + str(raw_read_eq) + \
+                          "\" delta=\"" + str(delta_read_eq) + "\" (SKIPPING)")
+                set.remove(counter)
+                continue
+
+            # A missing or empty normalization equation is simply falsy below
+            normalize_eq = fixup_equation(mdapi_counter.get('NormalizationEquation'))
+
+            if normalize_eq:
+                # Some normalization equations are represented with macros such as
+                # 'GpuDuration' corresponding to:
+                #
+                #   "$Self 100 UMUL $GpuCoreClocks FDIV"
+                #
+                # We expand macros here so tools don't need to care about them...
+                #
+                equation = normalize_eq
+                equation = expand_macros(equation)
+                if raw_read_eq:
+                    equation = equation.replace('$Self', raw_read_eq)
+            else:
+                equation = delta_read_eq
+
+            if '$Self' in equation:
+                print_err("WARNING: Counter equation (\"" + equation + "\") with unexpanded $Self token: MetricSet=\"" + \
+                          mdapi_set.get('ShortName') + "\" Metric=\"" + mdapi_counter.get('SymbolName') + \
+                          "(" + mdapi_counter.get('ShortName') + ")" + "\" (SKIPPING)")
+                set.remove(counter)
+                continue
+
+            # $$CounterName vs $CounterName in an equation is intended to
+            # differentiate referencing the normalized or raw value of another
+            # counter.
+            #
+            # Since we are only keeping a single (normalized) equation for
+            # counters we only need one form, but we want to be careful to
+            # check if any equations really depend on the raw value of another
+            # counter so we can expand those variables now
+            #
+            tmp = equation
+            for token in tmp.split():
+                if token[0] == '$' and token[1] != '$':
+                    if token[1:] in normalization_equations:
+                        raw_eq = raw_equations[token[1:]]
+
+                        equation = equation.replace(token, raw_eq)
+
+                    elif token[1:] not in raw_equations and token[1:] not in sys_vars:
+                        print_err("Unknown variable name: \"" + token + "\" in equation \"" + equation + "\"")
+
+            symbol_name = counter.get('symbol_name')
+
+            # Make sure that every variable in the equation is a known sys_var or counter name
+            equation = equation.replace('$$', "$")
+            for token in equation.split():
+                if token[0] == '$':
+                    if token[1:] not in counters and token[1:] not in sys_vars:
+                        print_err("WARNING: Counter equation (\"" + equation + "\") with unknown variable " + \
+                                  token + " (maybe skipped counter): MetricSet=\"" + mdapi_set.get('ShortName') + \
+                                  "\" Metric=\"" + mdapi_counter.get('SymbolName') + "(" + mdapi_counter.get('ShortName') + \
+                                  ")" + "\" (SKIPPING)")
+                        set.remove(counter)
+                        skip_counter = True
+                        break
+
+            if skip_counter:
+                continue
+
+            counter.set('equation', equation.strip())
+
+            if availability != None:
+                counter.set('availability', availability)
+
+            counters[symbol_name] = counter
+            if normalize_eq:
+                normalization_equations[symbol_name] = normalize_eq
+            if raw_read_eq:
+                raw_equations[symbol_name] = raw_read_eq
+
+
+# In dry-run mode the conversion above only serves to report errors
+if args.dry_run:
+    sys.exit(0)
+
+# Merge in any custom meta data we have...
+if args.merge:
+    merge = et.parse(args.merge)
+    merge_metrics = merge.getroot()
+
+    for merge_set in merge.findall(".//set"):
+        pattern = ".//set[@symbol_name=\"" + merge_set.get('symbol_name') + "\"][@chipset=\"" + merge_set.get('chipset') + "\"]"
+        real_set = metrics.find(pattern)
+        if real_set is not None:
+            for set_attr in merge_set.items():
+                real_set.set(set_attr[0], set_attr[1])
+
+            for merge_elem in merge_set:
+                if merge_elem.tag == "counter":
+                    merge_counter = merge_elem
+                    pattern = "counter[@symbol_name=\"" + merge_counter.get('symbol_name') + "\"]"
+                    real_counter = real_set.find(pattern)
+                    if real_counter is not None:
+                        for counter_attr in merge_counter.items():
+                            real_counter.set(counter_attr[0], counter_attr[1])
+                    else:
+                        real_set.append(merge_counter)
+                        real_counter = merge_counter
+                else:
+                    real_set.append(merge_elem)
+
+    # For consistency + readability print everything manually...
+    merge_md5 = hashlib.md5(open("merge.xml", 'rb').read()).hexdigest()
+else:
+    merge_md5 = ""
+
+print ("<?xml version=\"1.0\"?>")
+print("<metrics version=\"" + str(int(time.time())) + "\" merge_md5=\"" + merge_md5 + "\">")
+for set in metrics.findall(".//set"):
+    print("  <set name=\"" + set.get('name') + "\"")
+    del set.attrib['name']
+    for attr in set.items():
+        print("       " + attr[0] + "=\"" + attr[1] + "\"")
+    print("       >")
+    for counter in set.findall("counter"):
+        print("    <counter name=\"" + counter.get('name') + "\"")
+        del counter.attrib['name']
+        for attr in counter.items():
+            if attr[0][:6] != "mdapi_":
+                print("             " + attr[0] + "=\"" + saxutils.escape(attr[1]) + "\"")
+        for attr in counter.items():
+            if attr[0][:6] == "mdapi_":
+                print("             " + attr[0] + "=\"" + saxutils.escape(attr[1]) + "\"")
+        print("             />")
+    for config in set.findall("register_config"):
+        if config.get('availability') != None:
+            print("    <register_config type=\"" + config.get('type') + "\"")
+            print("                     availability=\"" + saxutils.escape(config.get('availability')) + "\"")
+            print("                     priority=\"" + config.get('priority') + "\"")
+            print("                     >")
+        else:
+            print("    <register_config type=\"" + config.get('type') + "\">")
+        for reg in config.findall("register"):
+            addr = int(reg.get('address'), 16)
+
+            if 'registers' in chipsets[chipset] and addr in chipsets[chipset]['registers']:
+                reg_info = chipsets[chipset]['registers'][addr]
+                comment = ' <!--' + reg_info['name'] + ' -->'
+            else:
+                comment = ''
+
+            print("        <register type=\"" + reg.get('type') + "\" address=\"" + reg.get('address') + "\" value=\"" + reg.get('value') + "\" />" + comment)
+        print("    </register_config>")
+    print("  </set>\n")
+print("</metrics>")
diff --git a/lib/i915/perf-configs/oa-bdw.xml b/lib/i915/perf-configs/oa-bdw.xml
new file mode 100644
index 00000000..3cd833c3
--- /dev/null
+++ b/lib/i915/perf-configs/oa-bdw.xml
@@ -0,0 +1,15653 @@
+<?xml version="1.0"?>
+<metrics version="1581935518" merge_md5="">
+  <set name="Render Metrics Basic Gen8"
+       mdapi_supported_apis="VK OGL OCL IO BB"
+       underscore_name="render_basic"
+       hw_config_guid="b541bd57-0e0f-4154-b4c0-5858010a2bf7"
+       chipset="BDW"
+       symbol_name="RenderBasic"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Misses"
+             description="The total number of L3 misses."
+             data_type="uint64"
+             equation="C 4 READ"
+             underscore_name="l3_misses"
+             units="messages"
+             symbol_name="L3Misses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/TAG"
+             />
+    <counter name="GTI L3 Throughput"
+             description="The total number of GPU memory bytes transferred between L3 caches and GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="$L3Misses 64 UMUL"
+             underscore_name="gti_l3_throughput"
+             units="bytes"
+             symbol_name="GtiL3Throughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Cache Misses"
+             description="The total number of sampler cache misses in all LODs in all sampler units."
+             data_type="uint64"
+             equation="B 4 READ B 5 READ UADD 8 UMUL"
+             underscore_name="sampler_l1_misses"
+             units="messages"
+             symbol_name="SamplerL1Misses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler 1 Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which Sampler 1 has been slowing down the pipe when processing EU requests."
+             data_type="float"
+             high_watermark="15"
+             equation="B 3 READ 100 UMUL $GpuCoreClocks FDIV"
+             max_equation="100"
+             underscore_name="sampler1_bottleneck"
+             units="percent"
+             symbol_name="Sampler1Bottleneck"
+             availability="$SubsliceMask 0x12 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="L3 Sampler Throughput"
+             description="The total number of GPU memory bytes transferred between samplers and L3 caches."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="$SamplerL1Misses 64 UMUL"
+             underscore_name="l3_sampler_throughput"
+             units="bytes"
+             symbol_name="L3SamplerThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Sampler"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Sampler 0 Busy"
+             description="The percentage of time in which Sampler 0 has been processing EU requests."
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler0_busy"
+             units="percent"
+             symbol_name="Sampler0Busy"
+             availability="$SubsliceMask 0x09 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_group="Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Sampler 1 Busy"
+             description="The percentage of time in which Sampler 1 has been processing EU requests."
+             data_type="float"
+             max_equation="100"
+             equation="B 1 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler1_busy"
+             units="percent"
+             symbol_name="Sampler1Busy"
+             availability="$SubsliceMask 0x12 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_group="Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Samplers Busy"
+             description="The percentage of time in which samplers have been processing EU requests."
+             data_type="float"
+             max_equation="100"
+             equation="$Sampler0Busy $Sampler1Busy FMAX"
+             underscore_name="samplers_busy"
+             units="percent"
+             symbol_name="SamplersBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="Sampler"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="GTI Fixed Pipe Throughput"
+             description="The total number of GPU memory bytes transferred between 3D Pipeline (Command Dispatch, Input Assembly and Stream Output) and GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL"
+             equation="B 6 READ B 7 READ UADD 64 UMUL"
+             underscore_name="gti_vf_throughput"
+             units="bytes"
+             symbol_name="GtiVfThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="GTI/3D Pipe"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler 0 Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which Sampler 0 has been slowing down the pipe when processing EU requests."
+             data_type="float"
+             high_watermark="15"
+             equation="B 2 READ 100 UMUL $GpuCoreClocks FDIV"
+             max_equation="100"
+             underscore_name="sampler0_bottleneck"
+             units="percent"
+             symbol_name="Sampler0Bottleneck"
+             availability="$SubsliceMask 0x09 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texel lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="L3 Lookup Accesses w/o IC"
+             description="The total number of L3 cache lookup accesses w/o IC."
+             data_type="uint64"
+             equation="$SamplerL1Misses $ShaderMemoryAccesses UADD"
+             underscore_name="l3_lookups"
+             units="messages"
+             symbol_name="L3Lookups"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/TAG"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GTI Read Throughput"
+             description="The total number of GPU memory bytes read from GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL"
+             equation="C 6 READ 64 UMUL"
+             underscore_name="gti_read_throughput"
+             units="bytes"
+             symbol_name="GtiReadThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GTI Depth Throughput"
+             description="The total number of GPU memory bytes transferred between depth caches and GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="C 0 READ C 1 READ UADD 64 UMUL"
+             underscore_name="gti_depth_throughput"
+             units="bytes"
+             symbol_name="GtiDepthThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="GTI/Depth Cache"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Samplers Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which samplers have been slowing down the pipe when processing EU requests."
+             data_type="float"
+             high_watermark="15"
+             equation="$Sampler0Bottleneck $Sampler1Bottleneck FMAX"
+             max_equation="100"
+             underscore_name="sampler_bottleneck"
+             units="percent"
+             symbol_name="SamplerBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Indicate System Frame Batch Draw"
+             mdapi_group="Sampler"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="GTI HDC TLB Lookup Throughput"
+             description="The total number of GPU memory bytes transferred between GTI and HDC, when HDC is doing TLB lookups."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="C 5 READ 64 UMUL"
+             underscore_name="gti_hdc_lookups_throughput"
+             units="bytes"
+             symbol_name="GtiHdcLookupsThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GTI RCC Throughput"
+             description="The total number of GPU memory bytes transferred between render color caches and GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="C 2 READ C 3 READ UADD 64 UMUL"
+             underscore_name="gti_rcc_throughput"
+             units="bytes"
+             symbol_name="GtiRccThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="GTI/Color Cache"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="GTI Write Throughput"
+             description="The total number of GPU memory bytes written to GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 32 UMUL"
+             equation="C 7 READ 64 UMUL"
+             underscore_name="gti_write_throughput"
+             units="bytes"
+             symbol_name="GtiWriteThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL 2 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses UADD UADD 64 UMUL"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA"
+                     availability="$SliceMask 0x01 AND"
+                     priority="0"
+                     >
+        <register type="NOA" address="0x00009840" value="0x000000A0" />
+        <register type="NOA" address="0x00009888" value="0x143F000F" />
+        <register type="NOA" address="0x00009888" value="0x14110014" />
+        <register type="NOA" address="0x00009888" value="0x14310014" />
+        <register type="NOA" address="0x00009888" value="0x14BF000F" />
+        <register type="NOA" address="0x00009888" value="0x118A0317" />
+        <register type="NOA" address="0x00009888" value="0x13837BE0" />
+        <register type="NOA" address="0x00009888" value="0x3B800060" />
+        <register type="NOA" address="0x00009888" value="0x3D800005" />
+        <register type="NOA" address="0x00009888" value="0x005C4000" />
+        <register type="NOA" address="0x00009888" value="0x065C8000" />
+        <register type="NOA" address="0x00009888" value="0x085CC000" />
+        <register type="NOA" address="0x00009888" value="0x003D8000" />
+        <register type="NOA" address="0x00009888" value="0x183D0800" />
+        <register type="NOA" address="0x00009888" value="0x0A3F0023" />
+        <register type="NOA" address="0x00009888" value="0x103F0000" />
+        <register type="NOA" address="0x00009888" value="0x00584000" />
+        <register type="NOA" address="0x00009888" value="0x08584000" />
+        <register type="NOA" address="0x00009888" value="0x0A5A4000" />
+        <register type="NOA" address="0x00009888" value="0x005B4000" />
+        <register type="NOA" address="0x00009888" value="0x0E5B8000" />
+        <register type="NOA" address="0x00009888" value="0x185B2400" />
+        <register type="NOA" address="0x00009888" value="0x0A1D4000" />
+        <register type="NOA" address="0x00009888" value="0x0C1F0800" />
+        <register type="NOA" address="0x00009888" value="0x0E1FAA00" />
+        <register type="NOA" address="0x00009888" value="0x00384000" />
+        <register type="NOA" address="0x00009888" value="0x0E384000" />
+        <register type="NOA" address="0x00009888" value="0x16384000" />
+        <register type="NOA" address="0x00009888" value="0x18380001" />
+        <register type="NOA" address="0x00009888" value="0x00392000" />
+        <register type="NOA" address="0x00009888" value="0x06398000" />
+        <register type="NOA" address="0x00009888" value="0x0839A000" />
+        <register type="NOA" address="0x00009888" value="0x0A391000" />
+        <register type="NOA" address="0x00009888" value="0x00104000" />
+        <register type="NOA" address="0x00009888" value="0x08104000" />
+        <register type="NOA" address="0x00009888" value="0x00110030" />
+        <register type="NOA" address="0x00009888" value="0x08110031" />
+        <register type="NOA" address="0x00009888" value="0x10110000" />
+        <register type="NOA" address="0x00009888" value="0x00134000" />
+        <register type="NOA" address="0x00009888" value="0x16130020" />
+        <register type="NOA" address="0x00009888" value="0x06308000" />
+        <register type="NOA" address="0x00009888" value="0x08308000" />
+        <register type="NOA" address="0x00009888" value="0x06311800" />
+        <register type="NOA" address="0x00009888" value="0x08311880" />
+        <register type="NOA" address="0x00009888" value="0x10310000" />
+        <register type="NOA" address="0x00009888" value="0x0E334000" />
+        <register type="NOA" address="0x00009888" value="0x16330080" />
+        <register type="NOA" address="0x00009888" value="0x0ABF1180" />
+        <register type="NOA" address="0x00009888" value="0x10BF0000" />
+        <register type="NOA" address="0x00009888" value="0x0ADA8000" />
+        <register type="NOA" address="0x00009888" value="0x0A9D8000" />
+        <register type="NOA" address="0x00009888" value="0x109F0002" />
+        <register type="NOA" address="0x00009888" value="0x0AB94000" />
+        <register type="NOA" address="0x00009888" value="0x0D888000" />
+        <register type="NOA" address="0x00009888" value="0x038A0380" />
+        <register type="NOA" address="0x00009888" value="0x058A000E" />
+        <register type="NOA" address="0x00009888" value="0x018A8000" />
+        <register type="NOA" address="0x00009888" value="0x0F8A8000" />
+        <register type="NOA" address="0x00009888" value="0x198A8000" />
+        <register type="NOA" address="0x00009888" value="0x1B8A00A0" />
+        <register type="NOA" address="0x00009888" value="0x078A0000" />
+        <register type="NOA" address="0x00009888" value="0x098A0000" />
+        <register type="NOA" address="0x00009888" value="0x238B2820" />
+        <register type="NOA" address="0x00009888" value="0x258B2550" />
+        <register type="NOA" address="0x00009888" value="0x198C1000" />
+        <register type="NOA" address="0x00009888" value="0x0B8D8000" />
+        <register type="NOA" address="0x00009888" value="0x1F85AA80" />
+        <register type="NOA" address="0x00009888" value="0x2185AAA0" />
+        <register type="NOA" address="0x00009888" value="0x2385002A" />
+        <register type="NOA" address="0x00009888" value="0x0D831021" />
+        <register type="NOA" address="0x00009888" value="0x0F83572F" />
+        <register type="NOA" address="0x00009888" value="0x01835680" />
+        <register type="NOA" address="0x00009888" value="0x0383002C" />
+        <register type="NOA" address="0x00009888" value="0x11830000" />
+        <register type="NOA" address="0x00009888" value="0x19835400" />
+        <register type="NOA" address="0x00009888" value="0x1B830001" />
+        <register type="NOA" address="0x00009888" value="0x05830000" />
+        <register type="NOA" address="0x00009888" value="0x07834000" />
+        <register type="NOA" address="0x00009888" value="0x09834000" />
+        <register type="NOA" address="0x00009888" value="0x0184C000" />
+        <register type="NOA" address="0x00009888" value="0x07848000" />
+        <register type="NOA" address="0x00009888" value="0x0984C000" />
+        <register type="NOA" address="0x00009888" value="0x0B84C000" />
+        <register type="NOA" address="0x00009888" value="0x0D84C000" />
+        <register type="NOA" address="0x00009888" value="0x0F84C000" />
+        <register type="NOA" address="0x00009888" value="0x0384C000" />
+        <register type="NOA" address="0x00009888" value="0x05844000" />
+        <register type="NOA" address="0x00009888" value="0x1B80C137" />
+        <register type="NOA" address="0x00009888" value="0x1D80C147" />
+        <register type="NOA" address="0x00009888" value="0x21800000" />
+        <register type="NOA" address="0x00009888" value="0x1180C000" />
+        <register type="NOA" address="0x00009888" value="0x17808000" />
+        <register type="NOA" address="0x00009888" value="0x1980C000" />
+        <register type="NOA" address="0x00009888" value="0x1F80C000" />
+        <register type="NOA" address="0x00009888" value="0x1380C000" />
+        <register type="NOA" address="0x00009888" value="0x15804000" />
+        <register type="NOA" address="0x00009888" value="0x4D801110" />
+        <register type="NOA" address="0x00009888" value="0x4F800331" />
+        <register type="NOA" address="0x00009888" value="0x43800802" />
+        <register type="NOA" address="0x00009888" value="0x51800000" />
+        <register type="NOA" address="0x00009888" value="0x45801465" />
+        <register type="NOA" address="0x00009888" value="0x53801111" />
+        <register type="NOA" address="0x00009888" value="0x478014A5" />
+        <register type="NOA" address="0x00009888" value="0x31800000" />
+        <register type="NOA" address="0x00009888" value="0x3F800CA5" />
+        <register type="NOA" address="0x00009888" value="0x41800003" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+    </register_config>
+    <register_config type="NOA"
+                     availability="$SliceMask 0x02 AND"
+                     priority="1"
+                     >
+        <register type="NOA" address="0x00009840" value="0x000000A0" />
+        <register type="NOA" address="0x00009888" value="0x143F000F" />
+        <register type="NOA" address="0x00009888" value="0x14BF000F" />
+        <register type="NOA" address="0x00009888" value="0x14910014" />
+        <register type="NOA" address="0x00009888" value="0x14B10014" />
+        <register type="NOA" address="0x00009888" value="0x118A0317" />
+        <register type="NOA" address="0x00009888" value="0x13837BE0" />
+        <register type="NOA" address="0x00009888" value="0x3B800060" />
+        <register type="NOA" address="0x00009888" value="0x3D800005" />
+        <register type="NOA" address="0x00009888" value="0x0A3F0023" />
+        <register type="NOA" address="0x00009888" value="0x103F0000" />
+        <register type="NOA" address="0x00009888" value="0x0A5A4000" />
+        <register type="NOA" address="0x00009888" value="0x0A1D4000" />
+        <register type="NOA" address="0x00009888" value="0x0E1F8000" />
+        <register type="NOA" address="0x00009888" value="0x0A391000" />
+        <register type="NOA" address="0x00009888" value="0x00DC4000" />
+        <register type="NOA" address="0x00009888" value="0x06DC8000" />
+        <register type="NOA" address="0x00009888" value="0x08DCC000" />
+        <register type="NOA" address="0x00009888" value="0x00BD8000" />
+        <register type="NOA" address="0x00009888" value="0x18BD0800" />
+        <register type="NOA" address="0x00009888" value="0x0ABF1180" />
+        <register type="NOA" address="0x00009888" value="0x10BF0000" />
+        <register type="NOA" address="0x00009888" value="0x00D84000" />
+        <register type="NOA" address="0x00009888" value="0x08D84000" />
+        <register type="NOA" address="0x00009888" value="0x0ADA8000" />
+        <register type="NOA" address="0x00009888" value="0x00DB4000" />
+        <register type="NOA" address="0x00009888" value="0x0EDB8000" />
+        <register type="NOA" address="0x00009888" value="0x18DB2400" />
+        <register type="NOA" address="0x00009888" value="0x0A9D8000" />
+        <register type="NOA" address="0x00009888" value="0x0C9F0800" />
+        <register type="NOA" address="0x00009888" value="0x0E9F2A00" />
+        <register type="NOA" address="0x00009888" value="0x109F0002" />
+        <register type="NOA" address="0x00009888" value="0x00B84000" />
+        <register type="NOA" address="0x00009888" value="0x0EB84000" />
+        <register type="NOA" address="0x00009888" value="0x16B84000" />
+        <register type="NOA" address="0x00009888" value="0x18B80001" />
+        <register type="NOA" address="0x00009888" value="0x00B92000" />
+        <register type="NOA" address="0x00009888" value="0x06B98000" />
+        <register type="NOA" address="0x00009888" value="0x08B9A000" />
+        <register type="NOA" address="0x00009888" value="0x0AB94000" />
+        <register type="NOA" address="0x00009888" value="0x00904000" />
+        <register type="NOA" address="0x00009888" value="0x08904000" />
+        <register type="NOA" address="0x00009888" value="0x00910030" />
+        <register type="NOA" address="0x00009888" value="0x08910031" />
+        <register type="NOA" address="0x00009888" value="0x10910000" />
+        <register type="NOA" address="0x00009888" value="0x00934000" />
+        <register type="NOA" address="0x00009888" value="0x16930020" />
+        <register type="NOA" address="0x00009888" value="0x06B08000" />
+        <register type="NOA" address="0x00009888" value="0x08B08000" />
+        <register type="NOA" address="0x00009888" value="0x06B11800" />
+        <register type="NOA" address="0x00009888" value="0x08B11880" />
+        <register type="NOA" address="0x00009888" value="0x10B10000" />
+        <register type="NOA" address="0x00009888" value="0x0EB34000" />
+        <register type="NOA" address="0x00009888" value="0x16B30080" />
+        <register type="NOA" address="0x00009888" value="0x01888000" />
+        <register type="NOA" address="0x00009888" value="0x0D88B800" />
+        <register type="NOA" address="0x00009888" value="0x038A0380" />
+        <register type="NOA" address="0x00009888" value="0x058A000E" />
+        <register type="NOA" address="0x00009888" value="0x1B8A0080" />
+        <register type="NOA" address="0x00009888" value="0x078A0000" />
+        <register type="NOA" address="0x00009888" value="0x098A0000" />
+        <register type="NOA" address="0x00009888" value="0x238B2840" />
+        <register type="NOA" address="0x00009888" value="0x258B26A0" />
+        <register type="NOA" address="0x00009888" value="0x018C4000" />
+        <register type="NOA" address="0x00009888" value="0x0F8C4000" />
+        <register type="NOA" address="0x00009888" value="0x178C2000" />
+        <register type="NOA" address="0x00009888" value="0x198C1100" />
+        <register type="NOA" address="0x00009888" value="0x018D2000" />
+        <register type="NOA" address="0x00009888" value="0x078D8000" />
+        <register type="NOA" address="0x00009888" value="0x098DA000" />
+        <register type="NOA" address="0x00009888" value="0x0B8D8000" />
+        <register type="NOA" address="0x00009888" value="0x1F85AA80" />
+        <register type="NOA" address="0x00009888" value="0x2185AAA0" />
+        <register type="NOA" address="0x00009888" value="0x2385002A" />
+        <register type="NOA" address="0x00009888" value="0x0D831021" />
+        <register type="NOA" address="0x00009888" value="0x0F83572F" />
+        <register type="NOA" address="0x00009888" value="0x01835680" />
+        <register type="NOA" address="0x00009888" value="0x0383002C" />
+        <register type="NOA" address="0x00009888" value="0x11830000" />
+        <register type="NOA" address="0x00009888" value="0x19835400" />
+        <register type="NOA" address="0x00009888" value="0x1B830001" />
+        <register type="NOA" address="0x00009888" value="0x05830000" />
+        <register type="NOA" address="0x00009888" value="0x07834000" />
+        <register type="NOA" address="0x00009888" value="0x09834000" />
+        <register type="NOA" address="0x00009888" value="0x0184C000" />
+        <register type="NOA" address="0x00009888" value="0x07848000" />
+        <register type="NOA" address="0x00009888" value="0x0984C000" />
+        <register type="NOA" address="0x00009888" value="0x0B84C000" />
+        <register type="NOA" address="0x00009888" value="0x0D84C000" />
+        <register type="NOA" address="0x00009888" value="0x0F84C000" />
+        <register type="NOA" address="0x00009888" value="0x0384C000" />
+        <register type="NOA" address="0x00009888" value="0x05844000" />
+        <register type="NOA" address="0x00009888" value="0x1B80C137" />
+        <register type="NOA" address="0x00009888" value="0x1D80C147" />
+        <register type="NOA" address="0x00009888" value="0x21800000" />
+        <register type="NOA" address="0x00009888" value="0x1180C000" />
+        <register type="NOA" address="0x00009888" value="0x17808000" />
+        <register type="NOA" address="0x00009888" value="0x1980C000" />
+        <register type="NOA" address="0x00009888" value="0x1F80C000" />
+        <register type="NOA" address="0x00009888" value="0x1380C000" />
+        <register type="NOA" address="0x00009888" value="0x15804000" />
+        <register type="NOA" address="0x00009888" value="0x4D801550" />
+        <register type="NOA" address="0x00009888" value="0x4F800331" />
+        <register type="NOA" address="0x00009888" value="0x43800802" />
+        <register type="NOA" address="0x00009888" value="0x51800400" />
+        <register type="NOA" address="0x00009888" value="0x458004A1" />
+        <register type="NOA" address="0x00009888" value="0x53805555" />
+        <register type="NOA" address="0x00009888" value="0x47800421" />
+        <register type="NOA" address="0x00009888" value="0x31800000" />
+        <register type="NOA" address="0x00009888" value="0x3F801421" />
+        <register type="NOA" address="0x00009888" value="0x41800845" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x00800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+        <register type="OA" address="0x00002740" value="0x00000000" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E758" value="0x00015014" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+        <register type="FLEX" address="0x0000E65C" value="0x00055054" />
+    </register_config>
+  </set>
+
+  <set name="Compute Metrics Basic Gen8"
+       mdapi_supported_apis="VK OGL4 OCL IO BB"
+       underscore_name="compute_basic"
+       hw_config_guid="35fbc9b2-a891-40a6-a38d-022bb7057552"
+       chipset="BDW"
+       symbol_name="ComputeBasic"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Untyped Bytes Read"
+             description="The total number of untyped memory bytes read via Data Port."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="B 6 READ B 7 READ C 0 READ UADD UADD $EuSlicesTotalCount 64 UMUL UMUL"
+             underscore_name="untyped_bytes_read"
+             units="bytes"
+             symbol_name="UntypedBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Typed Bytes Written"
+             description="The total number of typed memory bytes written via Data Port."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="B 3 READ B 4 READ B 5 READ UADD UADD $EuSlicesTotalCount 64 UMUL UMUL"
+             underscore_name="typed_bytes_written"
+             units="bytes"
+             symbol_name="TypedBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="fpu0_active"
+             units="percent"
+             symbol_name="Fpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="fpu1_active"
+             units="percent"
+             symbol_name="Fpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU AVG IPC Rate"
+             description="The average rate of IPC calculated for 2 FPU pipelines."
+             data_type="float"
+             max_equation="2"
+             equation="A 9 READ  A 10 READ  A 11 READ UADD  A 9 READ USUB FDIV 1 FADD"
+             underscore_name="eu_avg_ipc_rate"
+             units="number"
+             symbol_name="EuAvgIpcRate"
+             semantic_type="ratio"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier4 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GTI Read Throughput"
+             description="The total number of GPU memory bytes read from GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL"
+             equation="C 4 READ 64 UMUL"
+             underscore_name="gti_read_throughput"
+             units="bytes"
+             symbol_name="GtiReadThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Untyped Writes"
+             description="The total number of untyped memory bytes written via Data Port."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="C 1 READ C 2 READ C 3 READ UADD UADD $EuSlicesTotalCount 64 UMUL UMUL"
+             underscore_name="untyped_bytes_written"
+             units="bytes"
+             symbol_name="UntypedBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="Typed Bytes Read"
+             description="The total number of typed memory bytes read via Data Port."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="B 0 READ B 1 READ B 2 READ UADD UADD $EuSlicesTotalCount 64 UMUL UMUL"
+             underscore_name="typed_bytes_read"
+             units="bytes"
+             symbol_name="TypedBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="EU Thread Occupancy"
+             description="The percentage of time in which hardware threads occupied EUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 13 READ 8 UMUL $EuCoresTotalCount UDIV $EuThreadsCount UDIV 100 UMUL  $GpuCoreClocks FDIV"
+             underscore_name="eu_thread_occupancy"
+             units="percent"
+             symbol_name="EuThreadOccupancy"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="GTI Write Throughput"
+             description="The total number of GPU memory bytes written to GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 32 UMUL"
+             equation="C 5 READ 64 UMUL"
+             underscore_name="gti_write_throughput"
+             units="bytes"
+             symbol_name="GtiWriteThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL 2 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses UADD UADD 64 UMUL"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <counter name="EU Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_send_active"
+             units="percent"
+             symbol_name="EuSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <register_config type="NOA"
+                     availability="$SliceMask 0x01 AND"
+                     priority="0"
+                     >
+        <register type="NOA" address="0x00009840" value="0x000000A0" />
+        <register type="NOA" address="0x00009888" value="0x105C00E0" />
+        <register type="NOA" address="0x00009888" value="0x105800E0" />
+        <register type="NOA" address="0x00009888" value="0x103800E0" />
+        <register type="NOA" address="0x00009888" value="0x3580001A" />
+        <register type="NOA" address="0x00009888" value="0x3B800060" />
+        <register type="NOA" address="0x00009888" value="0x3D800005" />
+        <register type="NOA" address="0x00009888" value="0x065C2100" />
+        <register type="NOA" address="0x00009888" value="0x0A5C0041" />
+        <register type="NOA" address="0x00009888" value="0x0C5C6600" />
+        <register type="NOA" address="0x00009888" value="0x005C6580" />
+        <register type="NOA" address="0x00009888" value="0x085C8000" />
+        <register type="NOA" address="0x00009888" value="0x0E5C8000" />
+        <register type="NOA" address="0x00009888" value="0x00580042" />
+        <register type="NOA" address="0x00009888" value="0x08582080" />
+        <register type="NOA" address="0x00009888" value="0x0C58004C" />
+        <register type="NOA" address="0x00009888" value="0x0E582580" />
+        <register type="NOA" address="0x00009888" value="0x005B4000" />
+        <register type="NOA" address="0x00009888" value="0x185B1000" />
+        <register type="NOA" address="0x00009888" value="0x1A5B0104" />
+        <register type="NOA" address="0x00009888" value="0x0C1FA800" />
+        <register type="NOA" address="0x00009888" value="0x0E1FAA00" />
+        <register type="NOA" address="0x00009888" value="0x101F02AA" />
+        <register type="NOA" address="0x00009888" value="0x08380042" />
+        <register type="NOA" address="0x00009888" value="0x0A382080" />
+        <register type="NOA" address="0x00009888" value="0x0E38404C" />
+        <register type="NOA" address="0x00009888" value="0x0238404B" />
+        <register type="NOA" address="0x00009888" value="0x00384000" />
+        <register type="NOA" address="0x00009888" value="0x16380000" />
+        <register type="NOA" address="0x00009888" value="0x18381145" />
+        <register type="NOA" address="0x00009888" value="0x04380000" />
+        <register type="NOA" address="0x00009888" value="0x0039A000" />
+        <register type="NOA" address="0x00009888" value="0x06398000" />
+        <register type="NOA" address="0x00009888" value="0x0839A000" />
+        <register type="NOA" address="0x00009888" value="0x0A39A000" />
+        <register type="NOA" address="0x00009888" value="0x0C39A000" />
+        <register type="NOA" address="0x00009888" value="0x0E39A000" />
+        <register type="NOA" address="0x00009888" value="0x02392000" />
+        <register type="NOA" address="0x00009888" value="0x018A8000" />
+        <register type="NOA" address="0x00009888" value="0x0F8A8000" />
+        <register type="NOA" address="0x00009888" value="0x198A8000" />
+        <register type="NOA" address="0x00009888" value="0x1B8AAAA0" />
+        <register type="NOA" address="0x00009888" value="0x1D8A0002" />
+        <register type="NOA" address="0x00009888" value="0x038A8000" />
+        <register type="NOA" address="0x00009888" value="0x058A8000" />
+        <register type="NOA" address="0x00009888" value="0x238B02A0" />
+        <register type="NOA" address="0x00009888" value="0x258B5550" />
+        <register type="NOA" address="0x00009888" value="0x278B0015" />
+        <register type="NOA" address="0x00009888" value="0x1F850A80" />
+        <register type="NOA" address="0x00009888" value="0x2185AAA0" />
+        <register type="NOA" address="0x00009888" value="0x2385002A" />
+        <register type="NOA" address="0x00009888" value="0x01834000" />
+        <register type="NOA" address="0x00009888" value="0x0F834000" />
+        <register type="NOA" address="0x00009888" value="0x19835400" />
+        <register type="NOA" address="0x00009888" value="0x1B830155" />
+        <register type="NOA" address="0x00009888" value="0x03834000" />
+        <register type="NOA" address="0x00009888" value="0x05834000" />
+        <register type="NOA" address="0x00009888" value="0x0184C000" />
+        <register type="NOA" address="0x00009888" value="0x07848000" />
+        <register type="NOA" address="0x00009888" value="0x0984C000" />
+        <register type="NOA" address="0x00009888" value="0x0B84C000" />
+        <register type="NOA" address="0x00009888" value="0x0D84C000" />
+        <register type="NOA" address="0x00009888" value="0x0F84C000" />
+        <register type="NOA" address="0x00009888" value="0x03844000" />
+        <register type="NOA" address="0x00009888" value="0x17808137" />
+        <register type="NOA" address="0x00009888" value="0x1980C147" />
+        <register type="NOA" address="0x00009888" value="0x1B80C0E5" />
+        <register type="NOA" address="0x00009888" value="0x1D80C0E3" />
+        <register type="NOA" address="0x00009888" value="0x21800000" />
+        <register type="NOA" address="0x00009888" value="0x1180C000" />
+        <register type="NOA" address="0x00009888" value="0x1F80C000" />
+        <register type="NOA" address="0x00009888" value="0x13804000" />
+        <register type="NOA" address="0x00009888" value="0x15800000" />
+        <register type="NOA" address="0x00000D24" value="0x00000000" />
+        <register type="NOA" address="0x00009888" value="0x4D801000" />
+        <register type="NOA" address="0x00009888" value="0x4F800111" />
+        <register type="NOA" address="0x00009888" value="0x43800062" />
+        <register type="NOA" address="0x00009888" value="0x51800000" />
+        <register type="NOA" address="0x00009888" value="0x45800062" />
+        <register type="NOA" address="0x00009888" value="0x53800000" />
+        <register type="NOA" address="0x00009888" value="0x47800062" />
+        <register type="NOA" address="0x00009888" value="0x31800000" />
+        <register type="NOA" address="0x00009888" value="0x3F801062" />
+        <register type="NOA" address="0x00009888" value="0x41801084" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+    </register_config>
+    <register_config type="NOA"
+                     availability="$SliceMask 0x02 AND"
+                     priority="2"
+                     >
+        <register type="NOA" address="0x00009840" value="0x000000A0" />
+        <register type="NOA" address="0x00009888" value="0x10DC00E0" />
+        <register type="NOA" address="0x00009888" value="0x10D800E0" />
+        <register type="NOA" address="0x00009888" value="0x10B800E0" />
+        <register type="NOA" address="0x00009888" value="0x3580001A" />
+        <register type="NOA" address="0x00009888" value="0x3B800060" />
+        <register type="NOA" address="0x00009888" value="0x3D800005" />
+        <register type="NOA" address="0x00009888" value="0x06DC2100" />
+        <register type="NOA" address="0x00009888" value="0x0ADC0041" />
+        <register type="NOA" address="0x00009888" value="0x0CDC6600" />
+        <register type="NOA" address="0x00009888" value="0x00DC6580" />
+        <register type="NOA" address="0x00009888" value="0x08DC8000" />
+        <register type="NOA" address="0x00009888" value="0x0EDC8000" />
+        <register type="NOA" address="0x00009888" value="0x00D80042" />
+        <register type="NOA" address="0x00009888" value="0x08D82080" />
+        <register type="NOA" address="0x00009888" value="0x0CD8004C" />
+        <register type="NOA" address="0x00009888" value="0x0ED82580" />
+        <register type="NOA" address="0x00009888" value="0x00DB4000" />
+        <register type="NOA" address="0x00009888" value="0x18DB1000" />
+        <register type="NOA" address="0x00009888" value="0x1ADB0104" />
+        <register type="NOA" address="0x00009888" value="0x0C9FA800" />
+        <register type="NOA" address="0x00009888" value="0x0E9FAA00" />
+        <register type="NOA" address="0x00009888" value="0x109F02AA" />
+        <register type="NOA" address="0x00009888" value="0x08B80042" />
+        <register type="NOA" address="0x00009888" value="0x0AB82080" />
+        <register type="NOA" address="0x00009888" value="0x0EB8404C" />
+        <register type="NOA" address="0x00009888" value="0x02B8404B" />
+        <register type="NOA" address="0x00009888" value="0x00B84000" />
+        <register type="NOA" address="0x00009888" value="0x16B80000" />
+        <register type="NOA" address="0x00009888" value="0x18B81145" />
+        <register type="NOA" address="0x00009888" value="0x04B80000" />
+        <register type="NOA" address="0x00009888" value="0x00B9A000" />
+        <register type="NOA" address="0x00009888" value="0x06B98000" />
+        <register type="NOA" address="0x00009888" value="0x08B9A000" />
+        <register type="NOA" address="0x00009888" value="0x0AB9A000" />
+        <register type="NOA" address="0x00009888" value="0x0CB9A000" />
+        <register type="NOA" address="0x00009888" value="0x0EB9A000" />
+        <register type="NOA" address="0x00009888" value="0x02B92000" />
+        <register type="NOA" address="0x00009888" value="0x01888000" />
+        <register type="NOA" address="0x00009888" value="0x0D88F800" />
+        <register type="NOA" address="0x00009888" value="0x0F88000F" />
+        <register type="NOA" address="0x00009888" value="0x03888000" />
+        <register type="NOA" address="0x00009888" value="0x05888000" />
+        <register type="NOA" address="0x00009888" value="0x238B0540" />
+        <register type="NOA" address="0x00009888" value="0x258BAAA0" />
+        <register type="NOA" address="0x00009888" value="0x278B002A" />
+        <register type="NOA" address="0x00009888" value="0x018C4000" />
+        <register type="NOA" address="0x00009888" value="0x0F8C4000" />
+        <register type="NOA" address="0x00009888" value="0x178C2000" />
+        <register type="NOA" address="0x00009888" value="0x198C5500" />
+        <register type="NOA" address="0x00009888" value="0x1B8C0015" />
+        <register type="NOA" address="0x00009888" value="0x038C4000" />
+        <register type="NOA" address="0x00009888" value="0x058C4000" />
+        <register type="NOA" address="0x00009888" value="0x018DA000" />
+        <register type="NOA" address="0x00009888" value="0x078D8000" />
+        <register type="NOA" address="0x00009888" value="0x098DA000" />
+        <register type="NOA" address="0x00009888" value="0x0B8DA000" />
+        <register type="NOA" address="0x00009888" value="0x0D8DA000" />
+        <register type="NOA" address="0x00009888" value="0x0F8DA000" />
+        <register type="NOA" address="0x00009888" value="0x038D2000" />
+        <register type="NOA" address="0x00009888" value="0x1F850A80" />
+        <register type="NOA" address="0x00009888" value="0x2185AAA0" />
+        <register type="NOA" address="0x00009888" value="0x2385002A" />
+        <register type="NOA" address="0x00009888" value="0x01834000" />
+        <register type="NOA" address="0x00009888" value="0x0F834000" />
+        <register type="NOA" address="0x00009888" value="0x19835400" />
+        <register type="NOA" address="0x00009888" value="0x1B830155" />
+        <register type="NOA" address="0x00009888" value="0x03834000" />
+        <register type="NOA" address="0x00009888" value="0x05834000" />
+        <register type="NOA" address="0x00009888" value="0x0184C000" />
+        <register type="NOA" address="0x00009888" value="0x07848000" />
+        <register type="NOA" address="0x00009888" value="0x0984C000" />
+        <register type="NOA" address="0x00009888" value="0x0B84C000" />
+        <register type="NOA" address="0x00009888" value="0x0D84C000" />
+        <register type="NOA" address="0x00009888" value="0x0F84C000" />
+        <register type="NOA" address="0x00009888" value="0x03844000" />
+        <register type="NOA" address="0x00009888" value="0x17808137" />
+        <register type="NOA" address="0x00009888" value="0x1980C147" />
+        <register type="NOA" address="0x00009888" value="0x1B80C0E5" />
+        <register type="NOA" address="0x00009888" value="0x1D80C0E3" />
+        <register type="NOA" address="0x00009888" value="0x21800000" />
+        <register type="NOA" address="0x00009888" value="0x1180C000" />
+        <register type="NOA" address="0x00009888" value="0x1F80C000" />
+        <register type="NOA" address="0x00009888" value="0x13804000" />
+        <register type="NOA" address="0x00009888" value="0x15800000" />
+        <register type="NOA" address="0x00000D24" value="0x00000000" />
+        <register type="NOA" address="0x00009888" value="0x4D805000" />
+        <register type="NOA" address="0x00009888" value="0x4F800555" />
+        <register type="NOA" address="0x00009888" value="0x43800062" />
+        <register type="NOA" address="0x00009888" value="0x51800000" />
+        <register type="NOA" address="0x00009888" value="0x45800062" />
+        <register type="NOA" address="0x00009888" value="0x53800000" />
+        <register type="NOA" address="0x00009888" value="0x47800062" />
+        <register type="NOA" address="0x00009888" value="0x31800000" />
+        <register type="NOA" address="0x00009888" value="0x3F800062" />
+        <register type="NOA" address="0x00009888" value="0x41800000" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x00800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+        <register type="OA" address="0x00002740" value="0x00000000" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00000003" />
+        <register type="FLEX" address="0x0000E658" value="0x00002001" />
+        <register type="FLEX" address="0x0000E758" value="0x00778008" />
+        <register type="FLEX" address="0x0000E45C" value="0x00088078" />
+        <register type="FLEX" address="0x0000E55C" value="0x00808708" />
+        <register type="FLEX" address="0x0000E65C" value="0x00A08908" />
+    </register_config>
+  </set>
+
+  <set name="Render Metrics for 3D Pipeline Profile"
+       mdapi_supported_apis="VK OGL OCL IO BB"
+       underscore_name="render_pipe_profile"
+       hw_config_guid="233d0544-fff7-4281-8291-e02f222aff72"
+       chipset="BDW"
+       symbol_name="RenderPipeProfile"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Bottleneck"
+             low_watermark="10"
+             description="The percentage of time in which vertex shader pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="30"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_bottleneck"
+             units="percent"
+             symbol_name="VsBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Hi-Depth Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which early hierarchical depth test pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="15"
+             equation="C 6 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="hi_depth_bottleneck"
+             units="percent"
+             symbol_name="HiDepthBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which geometry shader pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="15"
+             equation="B 3 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gs_bottleneck"
+             units="percent"
+             symbol_name="GsBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Geometry Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="BC Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which barycentric coordinates calculation pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="15"
+             equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="bc_bottleneck"
+             units="percent"
+             symbol_name="BcBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Rasterizer/Barycentric Calc"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="HS Stall"
+             description="The percentage of time in which hull shader pipeline stage was stalled."
+             data_type="float"
+             equation="C 1 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="hs_stall"
+             units="percent"
+             symbol_name="HsStall"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier4 Correlate Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Hull Shader"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texel lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="VF Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which vertex fetch pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="15"
+             equation="C 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vf_bottleneck"
+             units="percent"
+             symbol_name="VfBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Input Assembler"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Strip-Fans Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which strip-fans pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="10"
+             equation="B 6 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sf_bottleneck"
+             units="percent"
+             symbol_name="SfBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Rasterizer/Strip-Fans"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Accesses"
+             description="The total number of messages sent to samplers."
+             data_type="uint64"
+             equation="A 28 READ"
+             underscore_name="sampler_accesses"
+             units="messages"
+             symbol_name="SamplerAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler"
+             />
+    <counter name="SF Stall"
+             description="The percentage of time in which strip-fans pipeline stage was stalled."
+             data_type="float"
+             equation="C 5 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sf_stall"
+             units="percent"
+             symbol_name="SfStall"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Correlate Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Strip-Fans"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="HS Bottleneck"
+             low_watermark="3"
+             description="The percentage of time in which hull shader pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="9"
+             equation="B 1 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="hs_bottleneck"
+             units="percent"
+             symbol_name="HsBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Hull Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="CL Stall"
+             description="The percentage of time in which clipper pipeline stage was stalled."
+             data_type="float"
+             equation="C 4 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="cl_stall"
+             units="percent"
+             symbol_name="ClStall"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Correlate Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Clipper"
+             />
+    <counter name="SO Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which stream output pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="15"
+             equation="B 4 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="so_bottleneck"
+             units="percent"
+             symbol_name="SoBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Stream Output"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="DS Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which domain shader pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="15"
+             equation="B 2 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ds_bottleneck"
+             units="percent"
+             symbol_name="DsBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Domain Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Clipper Bottleneck"
+             low_watermark="10"
+             description="The percentage of time in which clipper pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="30"
+             equation="B 5 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="cl_bottleneck"
+             units="percent"
+             symbol_name="ClBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Clipper"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Stall"
+             description="The percentage of time in which domain shader pipeline stage was stalled."
+             data_type="float"
+             equation="C 2 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ds_stall"
+             units="percent"
+             symbol_name="DsStall"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier4 Correlate Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Domain Shader"
+             />
+    <counter name="Early Depth Bottleneck"
+             low_watermark="10"
+             description="The percentage of time in which early depth test pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="30"
+             equation="B 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="early_depth_bottleneck"
+             units="percent"
+             symbol_name="EarlyDepthBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL 2 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses UADD UADD 64 UMUL"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="SO Stall"
+             description="The percentage of time in which stream-output pipeline stage was stalled."
+             data_type="float"
+             equation="C 3 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="so_stall"
+             units="percent"
+             symbol_name="SoStall"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Correlate Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Stream Output"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x000000A0" />
+        <register type="NOA" address="0x00009888" value="0x0A1E0000" />
+        <register type="NOA" address="0x00009888" value="0x0C1F000F" />
+        <register type="NOA" address="0x00009888" value="0x10176800" />
+        <register type="NOA" address="0x00009888" value="0x1191001F" />
+        <register type="NOA" address="0x00009888" value="0x0B880320" />
+        <register type="NOA" address="0x00009888" value="0x01890C40" />
+        <register type="NOA" address="0x00009888" value="0x118A1C00" />
+        <register type="NOA" address="0x00009888" value="0x118D7C00" />
+        <register type="NOA" address="0x00009888" value="0x118E0020" />
+        <register type="NOA" address="0x00009888" value="0x118F4C00" />
+        <register type="NOA" address="0x00009888" value="0x11900000" />
+        <register type="NOA" address="0x00009888" value="0x13900001" />
+        <register type="NOA" address="0x00009888" value="0x065C4000" />
+        <register type="NOA" address="0x00009888" value="0x0C3D8000" />
+        <register type="NOA" address="0x00009888" value="0x06584000" />
+        <register type="NOA" address="0x00009888" value="0x0C5B4000" />
+        <register type="NOA" address="0x00009888" value="0x081E0040" />
+        <register type="NOA" address="0x00009888" value="0x0E1E0000" />
+        <register type="NOA" address="0x00009888" value="0x021F5400" />
+        <register type="NOA" address="0x00009888" value="0x001F0000" />
+        <register type="NOA" address="0x00009888" value="0x101F0010" />
+        <register type="NOA" address="0x00009888" value="0x0E1F0080" />
+        <register type="NOA" address="0x00009888" value="0x0C384000" />
+        <register type="NOA" address="0x00009888" value="0x06392000" />
+        <register type="NOA" address="0x00009888" value="0x0C13C000" />
+        <register type="NOA" address="0x00009888" value="0x06164000" />
+        <register type="NOA" address="0x00009888" value="0x06170012" />
+        <register type="NOA" address="0x00009888" value="0x00170000" />
+        <register type="NOA" address="0x00009888" value="0x01910005" />
+        <register type="NOA" address="0x00009888" value="0x07880002" />
+        <register type="NOA" address="0x00009888" value="0x01880C00" />
+        <register type="NOA" address="0x00009888" value="0x0F880000" />
+        <register type="NOA" address="0x00009888" value="0x0D880000" />
+        <register type="NOA" address="0x00009888" value="0x05880000" />
+        <register type="NOA" address="0x00009888" value="0x09890032" />
+        <register type="NOA" address="0x00009888" value="0x078A0800" />
+        <register type="NOA" address="0x00009888" value="0x0F8A0A00" />
+        <register type="NOA" address="0x00009888" value="0x198A4000" />
+        <register type="NOA" address="0x00009888" value="0x1B8A2000" />
+        <register type="NOA" address="0x00009888" value="0x1D8A0000" />
+        <register type="NOA" address="0x00009888" value="0x038A4000" />
+        <register type="NOA" address="0x00009888" value="0x0B8A8000" />
+        <register type="NOA" address="0x00009888" value="0x0D8A8000" />
+        <register type="NOA" address="0x00009888" value="0x238B54C0" />
+        <register type="NOA" address="0x00009888" value="0x258BAA55" />
+        <register type="NOA" address="0x00009888" value="0x278B0019" />
+        <register type="NOA" address="0x00009888" value="0x198C0100" />
+        <register type="NOA" address="0x00009888" value="0x058C4000" />
+        <register type="NOA" address="0x00009888" value="0x0F8D0015" />
+        <register type="NOA" address="0x00009888" value="0x018D1000" />
+        <register type="NOA" address="0x00009888" value="0x098D8000" />
+        <register type="NOA" address="0x00009888" value="0x0B8DF000" />
+        <register type="NOA" address="0x00009888" value="0x0D8D3000" />
+        <register type="NOA" address="0x00009888" value="0x038DE000" />
+        <register type="NOA" address="0x00009888" value="0x058D3000" />
+        <register type="NOA" address="0x00009888" value="0x0D8E0004" />
+        <register type="NOA" address="0x00009888" value="0x058E000C" />
+        <register type="NOA" address="0x00009888" value="0x098E0000" />
+        <register type="NOA" address="0x00009888" value="0x078E0000" />
+        <register type="NOA" address="0x00009888" value="0x038E0000" />
+        <register type="NOA" address="0x00009888" value="0x0B8F0020" />
+        <register type="NOA" address="0x00009888" value="0x198F0C00" />
+        <register type="NOA" address="0x00009888" value="0x078F8000" />
+        <register type="NOA" address="0x00009888" value="0x098F4000" />
+        <register type="NOA" address="0x00009888" value="0x0B900980" />
+        <register type="NOA" address="0x00009888" value="0x03900D80" />
+        <register type="NOA" address="0x00009888" value="0x01900000" />
+        <register type="NOA" address="0x00009888" value="0x1F85AA80" />
+        <register type="NOA" address="0x00009888" value="0x2185AAAA" />
+        <register type="NOA" address="0x00009888" value="0x2385002A" />
+        <register type="NOA" address="0x00009888" value="0x01834000" />
+        <register type="NOA" address="0x00009888" value="0x0F834000" />
+        <register type="NOA" address="0x00009888" value="0x19835400" />
+        <register type="NOA" address="0x00009888" value="0x1B830155" />
+        <register type="NOA" address="0x00009888" value="0x03834000" />
+        <register type="NOA" address="0x00009888" value="0x05834000" />
+        <register type="NOA" address="0x00009888" value="0x07834000" />
+        <register type="NOA" address="0x00009888" value="0x09834000" />
+        <register type="NOA" address="0x00009888" value="0x0B834000" />
+        <register type="NOA" address="0x00009888" value="0x0D834000" />
+        <register type="NOA" address="0x00009888" value="0x0184C000" />
+        <register type="NOA" address="0x00009888" value="0x0784C000" />
+        <register type="NOA" address="0x00009888" value="0x0984C000" />
+        <register type="NOA" address="0x00009888" value="0x0B84C000" />
+        <register type="NOA" address="0x00009888" value="0x0D84C000" />
+        <register type="NOA" address="0x00009888" value="0x0F84C000" />
+        <register type="NOA" address="0x00009888" value="0x0384C000" />
+        <register type="NOA" address="0x00009888" value="0x0584C000" />
+        <register type="NOA" address="0x00009888" value="0x1180C000" />
+        <register type="NOA" address="0x00009888" value="0x1780C000" />
+        <register type="NOA" address="0x00009888" value="0x1980C000" />
+        <register type="NOA" address="0x00009888" value="0x1B80C000" />
+        <register type="NOA" address="0x00009888" value="0x1D80C000" />
+        <register type="NOA" address="0x00009888" value="0x1F80C000" />
+        <register type="NOA" address="0x00009888" value="0x1380C000" />
+        <register type="NOA" address="0x00009888" value="0x1580C000" />
+        <register type="NOA" address="0x00000D24" value="0x00000000" />
+        <register type="NOA" address="0x00009888" value="0x4D801111" />
+        <register type="NOA" address="0x00009888" value="0x3D800800" />
+        <register type="NOA" address="0x00009888" value="0x4F801011" />
+        <register type="NOA" address="0x00009888" value="0x43800443" />
+        <register type="NOA" address="0x00009888" value="0x51801111" />
+        <register type="NOA" address="0x00009888" value="0x45800422" />
+        <register type="NOA" address="0x00009888" value="0x53801111" />
+        <register type="NOA" address="0x00009888" value="0x47800C60" />
+        <register type="NOA" address="0x00009888" value="0x21800000" />
+        <register type="NOA" address="0x00009888" value="0x31800000" />
+        <register type="NOA" address="0x00009888" value="0x3F800422" />
+        <register type="NOA" address="0x00009888" value="0x41800021" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002724" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002770" value="0x0007FFEA" />
+        <register type="OA" address="0x00002774" value="0x00007FFC" />
+        <register type="OA" address="0x00002778" value="0x0007AFFA" />
+        <register type="OA" address="0x0000277C" value="0x0000F5FD" />
+        <register type="OA" address="0x00002780" value="0x00079FFA" />
+        <register type="OA" address="0x00002784" value="0x0000F3FB" />
+        <register type="OA" address="0x00002788" value="0x0007BF7A" />
+        <register type="OA" address="0x0000278C" value="0x0000F7E7" />
+        <register type="OA" address="0x00002790" value="0x0007FEFA" />
+        <register type="OA" address="0x00002794" value="0x0000F7CF" />
+        <register type="OA" address="0x00002798" value="0x00077FFA" />
+        <register type="OA" address="0x0000279C" value="0x0000EFDF" />
+        <register type="OA" address="0x000027A0" value="0x0006FFFA" />
+        <register type="OA" address="0x000027A4" value="0x0000CFBF" />
+        <register type="OA" address="0x000027A8" value="0x0003FFFA" />
+        <register type="OA" address="0x000027AC" value="0x00005F7F" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00015014" />
+        <register type="FLEX" address="0x0000E658" value="0x00025024" />
+        <register type="FLEX" address="0x0000E758" value="0x00035034" />
+        <register type="FLEX" address="0x0000E45C" value="0x00045044" />
+        <register type="FLEX" address="0x0000E55C" value="0x00055054" />
+        <register type="FLEX" address="0x0000E65C" value="0x00065064" />
+    </register_config>
+  </set>
+
+  <set name="Memory Reads Distribution Gen8"
+       mdapi_supported_apis="VK OGL OCL IO BB"
+       underscore_name="memory_reads"
+       hw_config_guid="2b255d48-2117-4fef-a8f7-f151e1d25a2c"
+       chipset="BDW"
+       symbol_name="MemoryReads"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GtiL3Bank0Reads"
+             description="The total number of GTI memory reads from L3 Bank 0 (L3 Cache misses)."
+             data_type="uint64"
+             equation="C 4 READ"
+             underscore_name="gti_l3_bank0_reads"
+             units="messages"
+             symbol_name="GtiL3Bank0Reads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/L3"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="GtiRingAccesses"
+             description="The total number of all accesses from GTI to the ring."
+             data_type="uint64"
+             equation="C 3 READ 2 UMUL"
+             underscore_name="gti_ring_accesses"
+             units="messages"
+             symbol_name="GtiRingAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="GtiL3Bank3Reads"
+             description="The total number of GTI memory reads from L3 Bank 3 (L3 Cache misses)."
+             data_type="uint64"
+             equation="C 7 READ"
+             underscore_name="gti_l3_bank3_reads"
+             units="messages"
+             symbol_name="GtiL3Bank3Reads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="GTI/L3"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 OCL IO"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="GtiRsMemoryReads"
+             description="The total number of GTI memory reads from Resource Streamer."
+             data_type="uint64"
+             equation="B 2 READ"
+             underscore_name="gti_rs_memory_reads"
+             units="messages"
+             symbol_name="GtiRsMemoryReads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/3D Pipe/Resource Streamer"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GtiHizMemoryReads"
+             description="The total number of GTI memory reads from Hierarchical Depth Cache (Hi-Depth Cache misses)."
+             data_type="uint64"
+             equation="B 5 READ"
+             underscore_name="gti_hiz_memory_reads"
+             units="messages"
+             symbol_name="GtiHizMemoryReads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Depth Cache"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="GtiRccMemoryReads"
+             description="The total number of GTI memory reads from Render Color Cache (Render Color Cache misses)."
+             data_type="uint64"
+             equation="B 3 READ"
+             underscore_name="gti_rcc_memory_reads"
+             units="messages"
+             symbol_name="GtiRccMemoryReads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Color Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GtiL3Bank1Reads"
+             description="The total number of GTI memory reads from L3 Bank 1 (L3 Cache misses)."
+             data_type="uint64"
+             equation="C 5 READ"
+             underscore_name="gti_l3_bank1_reads"
+             units="messages"
+             symbol_name="GtiL3Bank1Reads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="GTI/L3"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GtiCmdStreamerMemoryReads"
+             description="The total number of GTI memory reads from Command Streamer."
+             data_type="uint64"
+             equation="B 0 READ"
+             underscore_name="gti_cmd_streamer_memory_reads"
+             units="messages"
+             symbol_name="GtiCmdStreamerMemoryReads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/3D Pipe/Command Streamer"
+             />
+    <counter name="GtiL3Bank2Reads"
+             description="The total number of GTI memory reads from L3 Bank 2 (L3 Cache misses)."
+             data_type="uint64"
+             equation="C 6 READ"
+             underscore_name="gti_l3_bank2_reads"
+             units="messages"
+             symbol_name="GtiL3Bank2Reads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="GTI/L3"
+             />
+    <counter name="GtiMemoryReads"
+             description="The total number of GTI memory reads."
+             data_type="uint64"
+             equation="C 0 READ"
+             underscore_name="gti_memory_reads"
+             units="messages"
+             symbol_name="GtiMemoryReads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="GtiRczMemoryReads"
+             description="The total number of GTI memory reads from Render Depth Cache (Render Depth Cache misses)."
+             data_type="uint64"
+             equation="B 7 READ"
+             underscore_name="gti_rcz_memory_reads"
+             units="messages"
+             symbol_name="GtiRczMemoryReads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Depth Cache"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="GtiMscMemoryReads"
+             description="The total number of GTI memory reads from Multisampling Color Cache (Multisampling Color Cache misses)."
+             data_type="uint64"
+             equation="B 4 READ"
+             underscore_name="gti_msc_memory_reads"
+             units="messages"
+             symbol_name="GtiMscMemoryReads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Color Cache"
+             />
+    <counter name="GtiVfMemoryReads"
+             description="The total number of GTI memory reads from Vertex Fetch."
+             data_type="uint64"
+             equation="B 1 READ"
+             underscore_name="gti_vf_memory_reads"
+             units="messages"
+             symbol_name="GtiVfMemoryReads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/3D Pipe/Vertex Fetch"
+             />
+    <counter name="GtiStcMemoryReads"
+             description="The total number of GTI memory reads from Stencil Cache (Stencil Cache misses)."
+             data_type="uint64"
+             equation="B 6 READ"
+             underscore_name="gti_stc_memory_reads"
+             units="messages"
+             symbol_name="GtiStcMemoryReads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Depth Cache"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL 2 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses UADD UADD 64 UMUL"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="GtiL3Reads"
+             description="The total number of GTI memory reads from L3 (L3 Cache misses)."
+             data_type="uint64"
+             equation="$GtiL3Bank0Reads $GtiL3Bank1Reads $GtiL3Bank2Reads $GtiL3Bank3Reads UADD UADD UADD"
+             underscore_name="gti_l3_reads"
+             units="messages"
+             symbol_name="GtiL3Reads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/L3"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x000000A0" />
+        <register type="NOA" address="0x00009888" value="0x198B0343" />
+        <register type="NOA" address="0x00009888" value="0x13845800" />
+        <register type="NOA" address="0x00009888" value="0x15840018" />
+        <register type="NOA" address="0x00009888" value="0x3580001A" />
+        <register type="NOA" address="0x00009888" value="0x038B6300" />
+        <register type="NOA" address="0x00009888" value="0x058B6B62" />
+        <register type="NOA" address="0x00009888" value="0x078B006A" />
+        <register type="NOA" address="0x00009888" value="0x118B0000" />
+        <register type="NOA" address="0x00009888" value="0x238B0000" />
+        <register type="NOA" address="0x00009888" value="0x258B0000" />
+        <register type="NOA" address="0x00009888" value="0x1F85A080" />
+        <register type="NOA" address="0x00009888" value="0x2185AAAA" />
+        <register type="NOA" address="0x00009888" value="0x2385000A" />
+        <register type="NOA" address="0x00009888" value="0x07834000" />
+        <register type="NOA" address="0x00009888" value="0x09834000" />
+        <register type="NOA" address="0x00009888" value="0x0B834000" />
+        <register type="NOA" address="0x00009888" value="0x0D834000" />
+        <register type="NOA" address="0x00009888" value="0x01840018" />
+        <register type="NOA" address="0x00009888" value="0x07844C80" />
+        <register type="NOA" address="0x00009888" value="0x09840D9A" />
+        <register type="NOA" address="0x00009888" value="0x0B840E9C" />
+        <register type="NOA" address="0x00009888" value="0x0D840F9E" />
+        <register type="NOA" address="0x00009888" value="0x0F840010" />
+        <register type="NOA" address="0x00009888" value="0x11840000" />
+        <register type="NOA" address="0x00009888" value="0x03848000" />
+        <register type="NOA" address="0x00009888" value="0x0584C000" />
+        <register type="NOA" address="0x00009888" value="0x2F8000E5" />
+        <register type="NOA" address="0x00009888" value="0x138080E3" />
+        <register type="NOA" address="0x00009888" value="0x1580C0E1" />
+        <register type="NOA" address="0x00009888" value="0x21800000" />
+        <register type="NOA" address="0x00009888" value="0x11804000" />
+        <register type="NOA" address="0x00009888" value="0x1780C000" />
+        <register type="NOA" address="0x00009888" value="0x1980C000" />
+        <register type="NOA" address="0x00009888" value="0x1B80C000" />
+        <register type="NOA" address="0x00009888" value="0x1D80C000" />
+        <register type="NOA" address="0x00009888" value="0x1F804000" />
+        <register type="NOA" address="0x00000D24" value="0x00000000" />
+        <register type="NOA" address="0x00009888" value="0x4D800000" />
+        <register type="NOA" address="0x00009888" value="0x3D800800" />
+        <register type="NOA" address="0x00009888" value="0x4F800000" />
+        <register type="NOA" address="0x00009888" value="0x43800842" />
+        <register type="NOA" address="0x00009888" value="0x51800000" />
+        <register type="NOA" address="0x00009888" value="0x45800842" />
+        <register type="NOA" address="0x00009888" value="0x53800000" />
+        <register type="NOA" address="0x00009888" value="0x47801042" />
+        <register type="NOA" address="0x00009888" value="0x31800000" />
+        <register type="NOA" address="0x00009888" value="0x3F800084" />
+        <register type="NOA" address="0x00009888" value="0x41800000" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002724" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x0000274C" value="0x86543210" />
+        <register type="OA" address="0x00002748" value="0x86543210" />
+        <register type="OA" address="0x00002744" value="0x00006667" />
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x0000275C" value="0x86543210" />
+        <register type="OA" address="0x00002758" value="0x86543210" />
+        <register type="OA" address="0x00002754" value="0x00006465" />
+        <register type="OA" address="0x00002750" value="0x00000000" />
+        <register type="OA" address="0x00002770" value="0x0007F81A" />
+        <register type="OA" address="0x00002774" value="0x0000FE00" />
+        <register type="OA" address="0x00002778" value="0x0007F82A" />
+        <register type="OA" address="0x0000277C" value="0x0000FE00" />
+        <register type="OA" address="0x00002780" value="0x0007F872" />
+        <register type="OA" address="0x00002784" value="0x0000FE00" />
+        <register type="OA" address="0x00002788" value="0x0007F8BA" />
+        <register type="OA" address="0x0000278C" value="0x0000FE00" />
+        <register type="OA" address="0x00002790" value="0x0007F87A" />
+        <register type="OA" address="0x00002794" value="0x0000FE00" />
+        <register type="OA" address="0x00002798" value="0x0007F8EA" />
+        <register type="OA" address="0x0000279C" value="0x0000FE00" />
+        <register type="OA" address="0x000027A0" value="0x0007F8E2" />
+        <register type="OA" address="0x000027A4" value="0x0000FE00" />
+        <register type="OA" address="0x000027A8" value="0x0007F8F2" />
+        <register type="OA" address="0x000027AC" value="0x0000FE00" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00015014" />
+        <register type="FLEX" address="0x0000E658" value="0x00025024" />
+        <register type="FLEX" address="0x0000E758" value="0x00035034" />
+        <register type="FLEX" address="0x0000E45C" value="0x00045044" />
+        <register type="FLEX" address="0x0000E55C" value="0x00055054" />
+        <register type="FLEX" address="0x0000E65C" value="0x00065064" />
+    </register_config>
+  </set>
+
+  <set name="Memory Writes Distribution Gen8"
+       mdapi_supported_apis="VK OGL OCL IO BB"
+       underscore_name="memory_writes"
+       hw_config_guid="f7fd3220-b466-4a4d-9f98-b0caf3f2394c"
+       chipset="BDW"
+       symbol_name="MemoryWrites"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GtiMemoryWrites"
+             description="The total number of GTI memory writes."
+             data_type="uint64"
+             equation="C 0 READ"
+             underscore_name="gti_memory_writes"
+             units="messages"
+             symbol_name="GtiMemoryWrites"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="GtiRingAccesses"
+             description="The total number of all GTI accesses to the ring."
+             data_type="uint64"
+             equation="C 3 READ 2 UMUL"
+             underscore_name="gti_ring_accesses"
+             units="messages"
+             symbol_name="GtiRingAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="GtiMscMemoryWrites"
+             description="The total number of GTI memory writes from Multisampling Color Cache (Multisampling Color Cache invalidations)."
+             data_type="uint64"
+             equation="B 4 READ"
+             underscore_name="gti_msc_memory_writes"
+             units="messages"
+             symbol_name="GtiMscMemoryWrites"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Color Cache"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="GtiCmdStreamerMemoryWrites"
+             description="The total number of GTI memory writes from Command Streamer."
+             data_type="uint64"
+             equation="B 0 READ"
+             underscore_name="gti_cmd_streamer_memory_writes"
+             units="messages"
+             symbol_name="GtiCmdStreamerMemoryWrites"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/3D Pipe/Command Streamer"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GtiL3Bank0Writes"
+             description="The total number of GTI memory writes from L3 Bank 0 (L3 Bank 0 invalidations)."
+             data_type="uint64"
+             equation="C 4 READ"
+             underscore_name="gti_l3_bank0_writes"
+             units="messages"
+             symbol_name="GtiL3Bank0Writes"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/L3"
+             />
+    <counter name="GtiL3Bank1Writes"
+             description="The total number of GTI memory writes from L3 Bank 1 (L3 Bank 1 invalidations)."
+             data_type="uint64"
+             equation="C 5 READ"
+             underscore_name="gti_l3_bank1_writes"
+             units="messages"
+             symbol_name="GtiL3Bank1Writes"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/L3"
+             />
+    <counter name="GtiL3Bank2Writes"
+             description="The total number of GTI memory writes from L3 Bank 2 (L3 Bank 2 invalidations)."
+             data_type="uint64"
+             equation="C 6 READ"
+             underscore_name="gti_l3_bank2_writes"
+             units="messages"
+             symbol_name="GtiL3Bank2Writes"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/L3"
+             />
+    <counter name="GtiL3Bank3Writes"
+             description="The total number of GTI memory writes from L3 Bank 3 (L3 Bank 3 invalidations)."
+             data_type="uint64"
+             equation="C 7 READ"
+             underscore_name="gti_l3_bank3_writes"
+             units="messages"
+             symbol_name="GtiL3Bank3Writes"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/L3"
+             />
+    <counter name="GtiL3Writes"
+             description="The total number of GTI memory writes from L3 (L3 invalidations)."
+             data_type="uint64"
+             equation="$GtiL3Bank0Writes $GtiL3Bank1Writes $GtiL3Bank2Writes $GtiL3Bank3Writes UADD UADD UADD"
+             underscore_name="gti_l3_writes"
+             units="messages"
+             symbol_name="GtiL3Writes"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/L3"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GtiRccMemoryWrites"
+             description="The total number of GTI memory writes from Render Color Cache (Render Color Cache invalidations)."
+             data_type="uint64"
+             equation="B 3 READ"
+             underscore_name="gti_rcc_memory_writes"
+             units="messages"
+             symbol_name="GtiRccMemoryWrites"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Color Cache"
+             />
+    <counter name="GtiSoMemoryWrites"
+             description="The total number of GTI memory writes from Stream Output."
+             data_type="uint64"
+             equation="B 2 READ"
+             underscore_name="gti_so_memory_writes"
+             units="messages"
+             symbol_name="GtiSoMemoryWrites"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/3D Pipe/Stream Output"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GtiStcMemoryWrites"
+             description="The total number of GTI memory writes from Stencil Cache."
+             data_type="uint64"
+             equation="B 6 READ"
+             underscore_name="gti_stc_memory_writes"
+             units="messages"
+             symbol_name="GtiStcMemoryWrites"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Depth Cache"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="GtiRczMemoryWrites"
+             description="The total number of GTI memory writes from Render Depth Cache."
+             data_type="uint64"
+             equation="B 7 READ"
+             underscore_name="gti_rcz_memory_writes"
+             units="messages"
+             symbol_name="GtiRczMemoryWrites"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Depth Cache"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL 2 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses UADD UADD 64 UMUL"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="GtiHizMemoryWrites"
+             description="The total number of GTI memory writes from Hierarchical Depth Cache."
+             data_type="uint64"
+             equation="B 5 READ"
+             underscore_name="gti_hiz_memory_writes"
+             units="messages"
+             symbol_name="GtiHizMemoryWrites"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Depth Cache"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x000000A0" />
+        <register type="NOA" address="0x00009888" value="0x198B0343" />
+        <register type="NOA" address="0x00009888" value="0x13845400" />
+        <register type="NOA" address="0x00009888" value="0x3580001A" />
+        <register type="NOA" address="0x00009888" value="0x3D800805" />
+        <register type="NOA" address="0x00009888" value="0x038B6300" />
+        <register type="NOA" address="0x00009888" value="0x058B6B62" />
+        <register type="NOA" address="0x00009888" value="0x078B006A" />
+        <register type="NOA" address="0x00009888" value="0x118B0000" />
+        <register type="NOA" address="0x00009888" value="0x238B0000" />
+        <register type="NOA" address="0x00009888" value="0x258B0000" />
+        <register type="NOA" address="0x00009888" value="0x1F85A080" />
+        <register type="NOA" address="0x00009888" value="0x2185AAAA" />
+        <register type="NOA" address="0x00009888" value="0x23850002" />
+        <register type="NOA" address="0x00009888" value="0x07834000" />
+        <register type="NOA" address="0x00009888" value="0x09834000" />
+        <register type="NOA" address="0x00009888" value="0x0B834000" />
+        <register type="NOA" address="0x00009888" value="0x0D834000" />
+        <register type="NOA" address="0x00009888" value="0x01840010" />
+        <register type="NOA" address="0x00009888" value="0x07844880" />
+        <register type="NOA" address="0x00009888" value="0x09840992" />
+        <register type="NOA" address="0x00009888" value="0x0B840A94" />
+        <register type="NOA" address="0x00009888" value="0x0D840B96" />
+        <register type="NOA" address="0x00009888" value="0x11840000" />
+        <register type="NOA" address="0x00009888" value="0x03848000" />
+        <register type="NOA" address="0x00009888" value="0x0584C000" />
+        <register type="NOA" address="0x00009888" value="0x2D800147" />
+        <register type="NOA" address="0x00009888" value="0x2F8000E5" />
+        <register type="NOA" address="0x00009888" value="0x138080E3" />
+        <register type="NOA" address="0x00009888" value="0x1580C0E1" />
+        <register type="NOA" address="0x00009888" value="0x21800000" />
+        <register type="NOA" address="0x00009888" value="0x11804000" />
+        <register type="NOA" address="0x00009888" value="0x1780C000" />
+        <register type="NOA" address="0x00009888" value="0x1980C000" />
+        <register type="NOA" address="0x00009888" value="0x1B80C000" />
+        <register type="NOA" address="0x00009888" value="0x1D80C000" />
+        <register type="NOA" address="0x00009888" value="0x1F800000" />
+        <register type="NOA" address="0x00000D24" value="0x00000000" />
+        <register type="NOA" address="0x00009888" value="0x4D800000" />
+        <register type="NOA" address="0x00009888" value="0x4F800000" />
+        <register type="NOA" address="0x00009888" value="0x43800842" />
+        <register type="NOA" address="0x00009888" value="0x51800000" />
+        <register type="NOA" address="0x00009888" value="0x45800842" />
+        <register type="NOA" address="0x00009888" value="0x53800000" />
+        <register type="NOA" address="0x00009888" value="0x47801082" />
+        <register type="NOA" address="0x00009888" value="0x31800000" />
+        <register type="NOA" address="0x00009888" value="0x3F800084" />
+        <register type="NOA" address="0x00009888" value="0x41800000" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002724" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x0000274C" value="0x86543210" />
+        <register type="OA" address="0x00002748" value="0x86543210" />
+        <register type="OA" address="0x00002744" value="0x00006667" />
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x0000275C" value="0x86543210" />
+        <register type="OA" address="0x00002758" value="0x86543210" />
+        <register type="OA" address="0x00002754" value="0x00006465" />
+        <register type="OA" address="0x00002750" value="0x00000000" />
+        <register type="OA" address="0x00002770" value="0x0007F81A" />
+        <register type="OA" address="0x00002774" value="0x0000FE00" />
+        <register type="OA" address="0x00002778" value="0x0007F82A" />
+        <register type="OA" address="0x0000277C" value="0x0000FE00" />
+        <register type="OA" address="0x00002780" value="0x0007F822" />
+        <register type="OA" address="0x00002784" value="0x0000FE00" />
+        <register type="OA" address="0x00002788" value="0x0007F8BA" />
+        <register type="OA" address="0x0000278C" value="0x0000FE00" />
+        <register type="OA" address="0x00002790" value="0x0007F87A" />
+        <register type="OA" address="0x00002794" value="0x0000FE00" />
+        <register type="OA" address="0x00002798" value="0x0007F8EA" />
+        <register type="OA" address="0x0000279C" value="0x0000FE00" />
+        <register type="OA" address="0x000027A0" value="0x0007F8E2" />
+        <register type="OA" address="0x000027A4" value="0x0000FE00" />
+        <register type="OA" address="0x000027A8" value="0x0007F8F2" />
+        <register type="OA" address="0x000027AC" value="0x0000FE00" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00015014" />
+        <register type="FLEX" address="0x0000E658" value="0x00025024" />
+        <register type="FLEX" address="0x0000E758" value="0x00035034" />
+        <register type="FLEX" address="0x0000E45C" value="0x00045044" />
+        <register type="FLEX" address="0x0000E55C" value="0x00055054" />
+        <register type="FLEX" address="0x0000E65C" value="0x00065064" />
+    </register_config>
+  </set>
+
+  <set name="Compute Metrics Extended Gen8"
+       mdapi_supported_apis="VK OGL4 OCL IO BB"
+       underscore_name="compute_extended"
+       hw_config_guid="e99ccaca-821c-4df9-97a7-96bdb7204e43"
+       chipset="BDW"
+       symbol_name="ComputeExtended"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="fpu0_active"
+             units="percent"
+             symbol_name="Fpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="fpu1_active"
+             units="percent"
+             symbol_name="Fpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU AVG IPC Rate"
+             description="The average rate of IPC calculated for 2 FPU pipelines."
+             data_type="float"
+             max_equation="2"
+             equation="A 9 READ  A 10 READ  A 11 READ UADD  A 9 READ USUB FDIV 1 FADD"
+             underscore_name="eu_avg_ipc_rate"
+             units="number"
+             symbol_name="EuAvgIpcRate"
+             semantic_type="ratio"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Typed Writes 0"
+             description="The subslice 0 typed writes."
+             data_type="uint64"
+             equation="C 0 READ"
+             underscore_name="typed_writes0"
+             units="messages"
+             symbol_name="TypedWrites0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="EuTypedAtomics0"
+             description="The subslice 0 EU Typed Atomics subslice 0."
+             data_type="uint64"
+             equation="B 5 READ"
+             underscore_name="eu_typed_atomics0"
+             units="messages"
+             symbol_name="EuTypedAtomics0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="Typed Atomics 0"
+             description="The subslice 0 typed atomics."
+             data_type="uint64"
+             equation="C 4 READ"
+             underscore_name="typed_atomics0"
+             units="messages"
+             symbol_name="TypedAtomics0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="TypedAtomicsPerCacheLine"
+             description="Ratio of EU typed atomics requests to L3 cache line writes."
+             data_type="float"
+             equation="$EuTypedAtomics0 $TypedAtomics0 FDIV"
+             underscore_name="typed_atomics_per_cache_line"
+             units="eu atomic requests to l3 cache lines"
+             symbol_name="TypedAtomicsPerCacheLine"
+             semantic_type="ratio"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="EuUntypedReads0"
+             description="The subslice 0 EU Untyped Reads subslice 0."
+             data_type="uint64"
+             equation="B 0 READ"
+             underscore_name="eu_untyped_reads0"
+             units="messages"
+             symbol_name="EuUntypedReads0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="Untyped Writes 0"
+             description="The subslice 0 untyped writes (including SLM writes)."
+             data_type="uint64"
+             equation="C 1 READ"
+             underscore_name="untyped_writes0"
+             units="messages"
+             symbol_name="UntypedWrites0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="EuUntypedAtomics0"
+             description="The subslice 0 EU Untyped Atomics subslice 0."
+             data_type="uint64"
+             equation="B 4 READ"
+             underscore_name="eu_untyped_atomics0"
+             units="messages"
+             symbol_name="EuUntypedAtomics0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="EuUntypedWrites0"
+             description="The subslice 0 EU Untyped Writes subslice 0."
+             data_type="uint64"
+             equation="B 1 READ"
+             underscore_name="eu_untyped_writes0"
+             units="messages"
+             symbol_name="EuUntypedWrites0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="EuA64UntypedWrites0"
+             description="The subslice 0 EU A64 Untyped Writes subslice 0."
+             data_type="uint64"
+             equation="B 7 READ"
+             underscore_name="eu_a64_untyped_writes0"
+             units="messages"
+             symbol_name="EuA64UntypedWrites0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="UntypedWritesPerCacheLine"
+             description="Ratio of EU untyped write requests to L3 cache line writes."
+             data_type="float"
+             equation="$EuUntypedWrites0 $EuA64UntypedWrites0 UADD $UntypedWrites0 FDIV"
+             underscore_name="untyped_writes_per_cache_line"
+             units="eu requests to l3 cache lines"
+             symbol_name="UntypedWritesPerCacheLine"
+             semantic_type="ratio"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EuTypedWrites0"
+             description="The subslice 0 EU Typed Writes subslice 0."
+             data_type="uint64"
+             equation="B 3 READ"
+             underscore_name="eu_typed_writes0"
+             units="messages"
+             symbol_name="EuTypedWrites0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="TypedWritesPerCacheLine"
+             description="Ratio of EU typed write requests to L3 cache line writes."
+             data_type="float"
+             equation="$EuTypedWrites0 $TypedWrites0 FDIV"
+             underscore_name="typed_writes_per_cache_line"
+             units="eu requests to l3 cache lines"
+             symbol_name="TypedWritesPerCacheLine"
+             semantic_type="ratio"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="Typed Reads 0"
+             description="The subslice 0 typed reads."
+             data_type="uint64"
+             equation="C 2 READ"
+             underscore_name="typed_reads0"
+             units="messages"
+             symbol_name="TypedReads0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="Untyped Reads 0"
+             description="The subslice 0 untyped reads (including SLM reads)."
+             data_type="uint64"
+             equation="C 3 READ"
+             underscore_name="untyped_reads0"
+             units="messages"
+             symbol_name="UntypedReads0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="EuA64UntypedReads0"
+             description="The subslice 0 EU A64 Untyped Reads subslice 0."
+             data_type="uint64"
+             equation="B 6 READ"
+             underscore_name="eu_a64_untyped_reads0"
+             units="messages"
+             symbol_name="EuA64UntypedReads0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="EU Thread Occupancy"
+             description="The percentage of time in which hardware threads occupied EUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 13 READ 8 UMUL $EuCoresTotalCount UDIV $EuThreadsCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_thread_occupancy"
+             units="percent"
+             symbol_name="EuThreadOccupancy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EuTypedReads0"
+             description="The subslice 0 EU Typed Reads subslice 0."
+             data_type="uint64"
+             equation="B 2 READ"
+             underscore_name="eu_typed_reads0"
+             units="messages"
+             symbol_name="EuTypedReads0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="UntypedReadsPerCacheLine"
+             description="Ratio of EU untyped read requests to L3 cache line reads."
+             data_type="float"
+             equation="$EuUntypedReads0 $EuA64UntypedReads0 UADD $UntypedReads0 FDIV"
+             underscore_name="untyped_reads_per_cache_line"
+             units="eu requests to l3 cache lines"
+             symbol_name="UntypedReadsPerCacheLine"
+             semantic_type="ratio"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="TypedReadsPerCacheLine"
+             description="Ratio of EU typed read requests to L3 cache line reads."
+             data_type="float"
+             equation="$EuTypedReads0 $TypedReads0 FDIV"
+             underscore_name="typed_reads_per_cache_line"
+             units="eu requests to l3 cache lines"
+             symbol_name="TypedReadsPerCacheLine"
+             semantic_type="ratio"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL 2 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses UADD UADD 64 UMUL"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <counter name="EU Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_send_active"
+             units="percent"
+             symbol_name="EuSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <register_config type="NOA"
+                     availability="$SubsliceMask 0x01 AND"
+                     priority="0"
+                     >
+        <register type="NOA" address="0x00009840" value="0x000000A0" />
+        <register type="NOA" address="0x00009888" value="0x143D0160" />
+        <register type="NOA" address="0x00009888" value="0x163D2800" />
+        <register type="NOA" address="0x00009888" value="0x183D0120" />
+        <register type="NOA" address="0x00009888" value="0x105800E0" />
+        <register type="NOA" address="0x00009888" value="0x005CC000" />
+        <register type="NOA" address="0x00009888" value="0x065C8000" />
+        <register type="NOA" address="0x00009888" value="0x085CC000" />
+        <register type="NOA" address="0x00009888" value="0x0A5CC000" />
+        <register type="NOA" address="0x00009888" value="0x0C5CC000" />
+        <register type="NOA" address="0x00009888" value="0x0E5CC000" />
+        <register type="NOA" address="0x00009888" value="0x025CC000" />
+        <register type="NOA" address="0x00009888" value="0x045CC000" />
+        <register type="NOA" address="0x00009888" value="0x003D0011" />
+        <register type="NOA" address="0x00009888" value="0x063D0900" />
+        <register type="NOA" address="0x00009888" value="0x083D0A13" />
+        <register type="NOA" address="0x00009888" value="0x0A3D0B15" />
+        <register type="NOA" address="0x00009888" value="0x0C3D2317" />
+        <register type="NOA" address="0x00009888" value="0x043D21B7" />
+        <register type="NOA" address="0x00009888" value="0x103D0000" />
+        <register type="NOA" address="0x00009888" value="0x0E3D0000" />
+        <register type="NOA" address="0x00009888" value="0x1A3D0000" />
+        <register type="NOA" address="0x00009888" value="0x0E5825C1" />
+        <register type="NOA" address="0x00009888" value="0x00586100" />
+        <register type="NOA" address="0x00009888" value="0x0258204C" />
+        <register type="NOA" address="0x00009888" value="0x06588000" />
+        <register type="NOA" address="0x00009888" value="0x0858C000" />
+        <register type="NOA" address="0x00009888" value="0x0A58C000" />
+        <register type="NOA" address="0x00009888" value="0x0C58C000" />
+        <register type="NOA" address="0x00009888" value="0x0458C000" />
+        <register type="NOA" address="0x00009888" value="0x005B4000" />
+        <register type="NOA" address="0x00009888" value="0x0E5B4000" />
+        <register type="NOA" address="0x00009888" value="0x185B5400" />
+        <register type="NOA" address="0x00009888" value="0x1A5B0155" />
+        <register type="NOA" address="0x00009888" value="0x025B4000" />
+        <register type="NOA" address="0x00009888" value="0x045B4000" />
+        <register type="NOA" address="0x00009888" value="0x065B4000" />
+        <register type="NOA" address="0x00009888" value="0x085B4000" />
+        <register type="NOA" address="0x00009888" value="0x0A5B4000" />
+        <register type="NOA" address="0x00009888" value="0x0C1FA800" />
+        <register type="NOA" address="0x00009888" value="0x0E1FAA2A" />
+        <register type="NOA" address="0x00009888" value="0x101F02AA" />
+        <register type="NOA" address="0x00009888" value="0x00384000" />
+        <register type="NOA" address="0x00009888" value="0x0E384000" />
+        <register type="NOA" address="0x00009888" value="0x16384000" />
+        <register type="NOA" address="0x00009888" value="0x18381555" />
+        <register type="NOA" address="0x00009888" value="0x02384000" />
+        <register type="NOA" address="0x00009888" value="0x04384000" />
+        <register type="NOA" address="0x00009888" value="0x06384000" />
+        <register type="NOA" address="0x00009888" value="0x08384000" />
+        <register type="NOA" address="0x00009888" value="0x0A384000" />
+        <register type="NOA" address="0x00009888" value="0x0039A000" />
+        <register type="NOA" address="0x00009888" value="0x06398000" />
+        <register type="NOA" address="0x00009888" value="0x0839A000" />
+        <register type="NOA" address="0x00009888" value="0x0A39A000" />
+        <register type="NOA" address="0x00009888" value="0x0C39A000" />
+        <register type="NOA" address="0x00009888" value="0x0E39A000" />
+        <register type="NOA" address="0x00009888" value="0x0239A000" />
+        <register type="NOA" address="0x00009888" value="0x0439A000" />
+        <register type="NOA" address="0x00009888" value="0x018A8000" />
+        <register type="NOA" address="0x00009888" value="0x0F8A8000" />
+        <register type="NOA" address="0x00009888" value="0x198A8000" />
+        <register type="NOA" address="0x00009888" value="0x1B8AAAA0" />
+        <register type="NOA" address="0x00009888" value="0x1D8A0002" />
+        <register type="NOA" address="0x00009888" value="0x038A8000" />
+        <register type="NOA" address="0x00009888" value="0x058A8000" />
+        <register type="NOA" address="0x00009888" value="0x078A8000" />
+        <register type="NOA" address="0x00009888" value="0x098A8000" />
+        <register type="NOA" address="0x00009888" value="0x0B8A8000" />
+        <register type="NOA" address="0x00009888" value="0x238B2AA0" />
+        <register type="NOA" address="0x00009888" value="0x258B5551" />
+        <register type="NOA" address="0x00009888" value="0x278B0015" />
+        <register type="NOA" address="0x00009888" value="0x1F85AA80" />
+        <register type="NOA" address="0x00009888" value="0x2185AAA2" />
+        <register type="NOA" address="0x00009888" value="0x2385002A" />
+        <register type="NOA" address="0x00009888" value="0x01834000" />
+        <register type="NOA" address="0x00009888" value="0x0F834000" />
+        <register type="NOA" address="0x00009888" value="0x19835400" />
+        <register type="NOA" address="0x00009888" value="0x1B830155" />
+        <register type="NOA" address="0x00009888" value="0x03834000" />
+        <register type="NOA" address="0x00009888" value="0x05834000" />
+        <register type="NOA" address="0x00009888" value="0x07834000" />
+        <register type="NOA" address="0x00009888" value="0x09834000" />
+        <register type="NOA" address="0x00009888" value="0x0B834000" />
+        <register type="NOA" address="0x00009888" value="0x0184C000" />
+        <register type="NOA" address="0x00009888" value="0x07848000" />
+        <register type="NOA" address="0x00009888" value="0x0984C000" />
+        <register type="NOA" address="0x00009888" value="0x0B84C000" />
+        <register type="NOA" address="0x00009888" value="0x0D84C000" />
+        <register type="NOA" address="0x00009888" value="0x0F84C000" />
+        <register type="NOA" address="0x00009888" value="0x0384C000" />
+        <register type="NOA" address="0x00009888" value="0x0584C000" />
+        <register type="NOA" address="0x00009888" value="0x1180C000" />
+        <register type="NOA" address="0x00009888" value="0x17808000" />
+        <register type="NOA" address="0x00009888" value="0x1980C000" />
+        <register type="NOA" address="0x00009888" value="0x1B80C000" />
+        <register type="NOA" address="0x00009888" value="0x1D80C000" />
+        <register type="NOA" address="0x00009888" value="0x1F80C000" />
+        <register type="NOA" address="0x00009888" value="0x1380C000" />
+        <register type="NOA" address="0x00009888" value="0x1580C000" />
+        <register type="NOA" address="0x00000D24" value="0x00000000" />
+        <register type="NOA" address="0x00009888" value="0x4D800000" />
+        <register type="NOA" address="0x00009888" value="0x3D800000" />
+        <register type="NOA" address="0x00009888" value="0x4F800000" />
+        <register type="NOA" address="0x00009888" value="0x43800000" />
+        <register type="NOA" address="0x00009888" value="0x51800000" />
+        <register type="NOA" address="0x00009888" value="0x45800000" />
+        <register type="NOA" address="0x00009888" value="0x53800000" />
+        <register type="NOA" address="0x00009888" value="0x47800420" />
+        <register type="NOA" address="0x00009888" value="0x21800000" />
+        <register type="NOA" address="0x00009888" value="0x31800000" />
+        <register type="NOA" address="0x00009888" value="0x3F800421" />
+        <register type="NOA" address="0x00009888" value="0x41800000" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+    </register_config>
+    <register_config type="NOA"
+                     availability="$SubsliceMask 0x02 AND"
+                     priority="2"
+                     >
+        <register type="NOA" address="0x00009840" value="0x000000A0" />
+        <register type="NOA" address="0x00009888" value="0x105C00E0" />
+        <register type="NOA" address="0x00009888" value="0x145B0160" />
+        <register type="NOA" address="0x00009888" value="0x165B2800" />
+        <register type="NOA" address="0x00009888" value="0x185B0120" />
+        <register type="NOA" address="0x00009888" value="0x0E5C25C1" />
+        <register type="NOA" address="0x00009888" value="0x005C6100" />
+        <register type="NOA" address="0x00009888" value="0x025C204C" />
+        <register type="NOA" address="0x00009888" value="0x065C8000" />
+        <register type="NOA" address="0x00009888" value="0x085CC000" />
+        <register type="NOA" address="0x00009888" value="0x0A5CC000" />
+        <register type="NOA" address="0x00009888" value="0x0C5CC000" />
+        <register type="NOA" address="0x00009888" value="0x045CC000" />
+        <register type="NOA" address="0x00009888" value="0x005B0011" />
+        <register type="NOA" address="0x00009888" value="0x065B0900" />
+        <register type="NOA" address="0x00009888" value="0x085B0A13" />
+        <register type="NOA" address="0x00009888" value="0x0A5B0B15" />
+        <register type="NOA" address="0x00009888" value="0x0C5B2317" />
+        <register type="NOA" address="0x00009888" value="0x045B21B7" />
+        <register type="NOA" address="0x00009888" value="0x105B0000" />
+        <register type="NOA" address="0x00009888" value="0x0E5B0000" />
+        <register type="NOA" address="0x00009888" value="0x1A5B0000" />
+        <register type="NOA" address="0x00009888" value="0x0C1FA800" />
+        <register type="NOA" address="0x00009888" value="0x0E1FAA2A" />
+        <register type="NOA" address="0x00009888" value="0x101F02AA" />
+        <register type="NOA" address="0x00009888" value="0x00384000" />
+        <register type="NOA" address="0x00009888" value="0x0E384000" />
+        <register type="NOA" address="0x00009888" value="0x16384000" />
+        <register type="NOA" address="0x00009888" value="0x18381555" />
+        <register type="NOA" address="0x00009888" value="0x02384000" />
+        <register type="NOA" address="0x00009888" value="0x04384000" />
+        <register type="NOA" address="0x00009888" value="0x06384000" />
+        <register type="NOA" address="0x00009888" value="0x08384000" />
+        <register type="NOA" address="0x00009888" value="0x0A384000" />
+        <register type="NOA" address="0x00009888" value="0x0039A000" />
+        <register type="NOA" address="0x00009888" value="0x06398000" />
+        <register type="NOA" address="0x00009888" value="0x0839A000" />
+        <register type="NOA" address="0x00009888" value="0x0A39A000" />
+        <register type="NOA" address="0x00009888" value="0x0C39A000" />
+        <register type="NOA" address="0x00009888" value="0x0E39A000" />
+        <register type="NOA" address="0x00009888" value="0x0239A000" />
+        <register type="NOA" address="0x00009888" value="0x0439A000" />
+        <register type="NOA" address="0x00009888" value="0x018A8000" />
+        <register type="NOA" address="0x00009888" value="0x0F8A8000" />
+        <register type="NOA" address="0x00009888" value="0x198A8000" />
+        <register type="NOA" address="0x00009888" value="0x1B8AAAA0" />
+        <register type="NOA" address="0x00009888" value="0x1D8A0002" />
+        <register type="NOA" address="0x00009888" value="0x038A8000" />
+        <register type="NOA" address="0x00009888" value="0x058A8000" />
+        <register type="NOA" address="0x00009888" value="0x078A8000" />
+        <register type="NOA" address="0x00009888" value="0x098A8000" />
+        <register type="NOA" address="0x00009888" value="0x0B8A8000" />
+        <register type="NOA" address="0x00009888" value="0x238B2AA0" />
+        <register type="NOA" address="0x00009888" value="0x258B5551" />
+        <register type="NOA" address="0x00009888" value="0x278B0015" />
+        <register type="NOA" address="0x00009888" value="0x1F85AA80" />
+        <register type="NOA" address="0x00009888" value="0x2185AAA2" />
+        <register type="NOA" address="0x00009888" value="0x2385002A" />
+        <register type="NOA" address="0x00009888" value="0x01834000" />
+        <register type="NOA" address="0x00009888" value="0x0F834000" />
+        <register type="NOA" address="0x00009888" value="0x19835400" />
+        <register type="NOA" address="0x00009888" value="0x1B830155" />
+        <register type="NOA" address="0x00009888" value="0x03834000" />
+        <register type="NOA" address="0x00009888" value="0x05834000" />
+        <register type="NOA" address="0x00009888" value="0x07834000" />
+        <register type="NOA" address="0x00009888" value="0x09834000" />
+        <register type="NOA" address="0x00009888" value="0x0B834000" />
+        <register type="NOA" address="0x00009888" value="0x0184C000" />
+        <register type="NOA" address="0x00009888" value="0x07848000" />
+        <register type="NOA" address="0x00009888" value="0x0984C000" />
+        <register type="NOA" address="0x00009888" value="0x0B84C000" />
+        <register type="NOA" address="0x00009888" value="0x0D84C000" />
+        <register type="NOA" address="0x00009888" value="0x0F84C000" />
+        <register type="NOA" address="0x00009888" value="0x0384C000" />
+        <register type="NOA" address="0x00009888" value="0x0584C000" />
+        <register type="NOA" address="0x00009888" value="0x1180C000" />
+        <register type="NOA" address="0x00009888" value="0x17808000" />
+        <register type="NOA" address="0x00009888" value="0x1980C000" />
+        <register type="NOA" address="0x00009888" value="0x1B80C000" />
+        <register type="NOA" address="0x00009888" value="0x1D80C000" />
+        <register type="NOA" address="0x00009888" value="0x1F80C000" />
+        <register type="NOA" address="0x00009888" value="0x1380C000" />
+        <register type="NOA" address="0x00009888" value="0x1580C000" />
+        <register type="NOA" address="0x00000D24" value="0x00000000" />
+        <register type="NOA" address="0x00009888" value="0x4D800000" />
+        <register type="NOA" address="0x00009888" value="0x3D800000" />
+        <register type="NOA" address="0x00009888" value="0x4F800000" />
+        <register type="NOA" address="0x00009888" value="0x43800000" />
+        <register type="NOA" address="0x00009888" value="0x51800000" />
+        <register type="NOA" address="0x00009888" value="0x45800000" />
+        <register type="NOA" address="0x00009888" value="0x53800000" />
+        <register type="NOA" address="0x00009888" value="0x47800420" />
+        <register type="NOA" address="0x00009888" value="0x21800000" />
+        <register type="NOA" address="0x00009888" value="0x31800000" />
+        <register type="NOA" address="0x00009888" value="0x3F800421" />
+        <register type="NOA" address="0x00009888" value="0x41800000" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+    </register_config>
+    <register_config type="NOA"
+                     availability="$SubsliceMask 0x04 AND"
+                     priority="4"
+                     >
+        <register type="NOA" address="0x00009840" value="0x000000A0" />
+        <register type="NOA" address="0x00009888" value="0x103800E0" />
+        <register type="NOA" address="0x00009888" value="0x143A0160" />
+        <register type="NOA" address="0x00009888" value="0x163A2800" />
+        <register type="NOA" address="0x00009888" value="0x183A0120" />
+        <register type="NOA" address="0x00009888" value="0x0C1FA800" />
+        <register type="NOA" address="0x00009888" value="0x0E1FAA2A" />
+        <register type="NOA" address="0x00009888" value="0x101F02AA" />
+        <register type="NOA" address="0x00009888" value="0x0E38A5C1" />
+        <register type="NOA" address="0x00009888" value="0x0038A100" />
+        <register type="NOA" address="0x00009888" value="0x0238204C" />
+        <register type="NOA" address="0x00009888" value="0x16388000" />
+        <register type="NOA" address="0x00009888" value="0x183802AA" />
+        <register type="NOA" address="0x00009888" value="0x04380000" />
+        <register type="NOA" address="0x00009888" value="0x06380000" />
+        <register type="NOA" address="0x00009888" value="0x08388000" />
+        <register type="NOA" address="0x00009888" value="0x0A388000" />
+        <register type="NOA" address="0x00009888" value="0x0039A000" />
+        <register type="NOA" address="0x00009888" value="0x06398000" />
+        <register type="NOA" address="0x00009888" value="0x0839A000" />
+        <register type="NOA" address="0x00009888" value="0x0A39A000" />
+        <register type="NOA" address="0x00009888" value="0x0C39A000" />
+        <register type="NOA" address="0x00009888" value="0x0E39A000" />
+        <register type="NOA" address="0x00009888" value="0x0239A000" />
+        <register type="NOA" address="0x00009888" value="0x0439A000" />
+        <register type="NOA" address="0x00009888" value="0x003A0011" />
+        <register type="NOA" address="0x00009888" value="0x063A0900" />
+        <register type="NOA" address="0x00009888" value="0x083A0A13" />
+        <register type="NOA" address="0x00009888" value="0x0A3A0B15" />
+        <register type="NOA" address="0x00009888" value="0x0C3A2317" />
+        <register type="NOA" address="0x00009888" value="0x043A21B7" />
+        <register type="NOA" address="0x00009888" value="0x103A0000" />
+        <register type="NOA" address="0x00009888" value="0x0E3A0000" />
+        <register type="NOA" address="0x00009888" value="0x1A3A0000" />
+        <register type="NOA" address="0x00009888" value="0x018A8000" />
+        <register type="NOA" address="0x00009888" value="0x0F8A8000" />
+        <register type="NOA" address="0x00009888" value="0x198A8000" />
+        <register type="NOA" address="0x00009888" value="0x1B8AAAA0" />
+        <register type="NOA" address="0x00009888" value="0x1D8A0002" />
+        <register type="NOA" address="0x00009888" value="0x038A8000" />
+        <register type="NOA" address="0x00009888" value="0x058A8000" />
+        <register type="NOA" address="0x00009888" value="0x078A8000" />
+        <register type="NOA" address="0x00009888" value="0x098A8000" />
+        <register type="NOA" address="0x00009888" value="0x0B8A8000" />
+        <register type="NOA" address="0x00009888" value="0x238B2AA0" />
+        <register type="NOA" address="0x00009888" value="0x258B5551" />
+        <register type="NOA" address="0x00009888" value="0x278B0015" />
+        <register type="NOA" address="0x00009888" value="0x1F85AA80" />
+        <register type="NOA" address="0x00009888" value="0x2185AAA2" />
+        <register type="NOA" address="0x00009888" value="0x2385002A" />
+        <register type="NOA" address="0x00009888" value="0x01834000" />
+        <register type="NOA" address="0x00009888" value="0x0F834000" />
+        <register type="NOA" address="0x00009888" value="0x19835400" />
+        <register type="NOA" address="0x00009888" value="0x1B830155" />
+        <register type="NOA" address="0x00009888" value="0x03834000" />
+        <register type="NOA" address="0x00009888" value="0x05834000" />
+        <register type="NOA" address="0x00009888" value="0x07834000" />
+        <register type="NOA" address="0x00009888" value="0x09834000" />
+        <register type="NOA" address="0x00009888" value="0x0B834000" />
+        <register type="NOA" address="0x00009888" value="0x0184C000" />
+        <register type="NOA" address="0x00009888" value="0x07848000" />
+        <register type="NOA" address="0x00009888" value="0x0984C000" />
+        <register type="NOA" address="0x00009888" value="0x0B84C000" />
+        <register type="NOA" address="0x00009888" value="0x0D84C000" />
+        <register type="NOA" address="0x00009888" value="0x0F84C000" />
+        <register type="NOA" address="0x00009888" value="0x0384C000" />
+        <register type="NOA" address="0x00009888" value="0x0584C000" />
+        <register type="NOA" address="0x00009888" value="0x1180C000" />
+        <register type="NOA" address="0x00009888" value="0x17808000" />
+        <register type="NOA" address="0x00009888" value="0x1980C000" />
+        <register type="NOA" address="0x00009888" value="0x1B80C000" />
+        <register type="NOA" address="0x00009888" value="0x1D80C000" />
+        <register type="NOA" address="0x00009888" value="0x1F80C000" />
+        <register type="NOA" address="0x00009888" value="0x1380C000" />
+        <register type="NOA" address="0x00009888" value="0x1580C000" />
+        <register type="NOA" address="0x00000D24" value="0x00000000" />
+        <register type="NOA" address="0x00009888" value="0x4D800000" />
+        <register type="NOA" address="0x00009888" value="0x3D800000" />
+        <register type="NOA" address="0x00009888" value="0x4F800000" />
+        <register type="NOA" address="0x00009888" value="0x43800000" />
+        <register type="NOA" address="0x00009888" value="0x51800000" />
+        <register type="NOA" address="0x00009888" value="0x45800000" />
+        <register type="NOA" address="0x00009888" value="0x53800000" />
+        <register type="NOA" address="0x00009888" value="0x47800420" />
+        <register type="NOA" address="0x00009888" value="0x21800000" />
+        <register type="NOA" address="0x00009888" value="0x31800000" />
+        <register type="NOA" address="0x00009888" value="0x3F800421" />
+        <register type="NOA" address="0x00009888" value="0x41800000" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+    </register_config>
+    <register_config type="NOA"
+                     availability="$SubsliceMask 0x08 AND"
+                     priority="1"
+                     >
+        <register type="NOA" address="0x00009840" value="0x000000A0" />
+        <register type="NOA" address="0x00009888" value="0x14BD0160" />
+        <register type="NOA" address="0x00009888" value="0x16BD2800" />
+        <register type="NOA" address="0x00009888" value="0x18BD0120" />
+        <register type="NOA" address="0x00009888" value="0x10D800E0" />
+        <register type="NOA" address="0x00009888" value="0x00DCC000" />
+        <register type="NOA" address="0x00009888" value="0x06DC8000" />
+        <register type="NOA" address="0x00009888" value="0x08DCC000" />
+        <register type="NOA" address="0x00009888" value="0x0ADCC000" />
+        <register type="NOA" address="0x00009888" value="0x0CDCC000" />
+        <register type="NOA" address="0x00009888" value="0x0EDCC000" />
+        <register type="NOA" address="0x00009888" value="0x02DCC000" />
+        <register type="NOA" address="0x00009888" value="0x04DCC000" />
+        <register type="NOA" address="0x00009888" value="0x00BD0011" />
+        <register type="NOA" address="0x00009888" value="0x06BD0900" />
+        <register type="NOA" address="0x00009888" value="0x08BD0A13" />
+        <register type="NOA" address="0x00009888" value="0x0ABD0B15" />
+        <register type="NOA" address="0x00009888" value="0x0CBD2317" />
+        <register type="NOA" address="0x00009888" value="0x04BD21B7" />
+        <register type="NOA" address="0x00009888" value="0x10BD0000" />
+        <register type="NOA" address="0x00009888" value="0x0EBD0000" />
+        <register type="NOA" address="0x00009888" value="0x1ABD0000" />
+        <register type="NOA" address="0x00009888" value="0x0ED825C1" />
+        <register type="NOA" address="0x00009888" value="0x00D86100" />
+        <register type="NOA" address="0x00009888" value="0x02D8204C" />
+        <register type="NOA" address="0x00009888" value="0x06D88000" />
+        <register type="NOA" address="0x00009888" value="0x08D8C000" />
+        <register type="NOA" address="0x00009888" value="0x0AD8C000" />
+        <register type="NOA" address="0x00009888" value="0x0CD8C000" />
+        <register type="NOA" address="0x00009888" value="0x04D8C000" />
+        <register type="NOA" address="0x00009888" value="0x00DB4000" />
+        <register type="NOA" address="0x00009888" value="0x0EDB4000" />
+        <register type="NOA" address="0x00009888" value="0x18DB5400" />
+        <register type="NOA" address="0x00009888" value="0x1ADB0155" />
+        <register type="NOA" address="0x00009888" value="0x02DB4000" />
+        <register type="NOA" address="0x00009888" value="0x04DB4000" />
+        <register type="NOA" address="0x00009888" value="0x06DB4000" />
+        <register type="NOA" address="0x00009888" value="0x08DB4000" />
+        <register type="NOA" address="0x00009888" value="0x0ADB4000" />
+        <register type="NOA" address="0x00009888" value="0x0C9FA800" />
+        <register type="NOA" address="0x00009888" value="0x0E9FAA2A" />
+        <register type="NOA" address="0x00009888" value="0x109F02AA" />
+        <register type="NOA" address="0x00009888" value="0x00B84000" />
+        <register type="NOA" address="0x00009888" value="0x0EB84000" />
+        <register type="NOA" address="0x00009888" value="0x16B84000" />
+        <register type="NOA" address="0x00009888" value="0x18B81555" />
+        <register type="NOA" address="0x00009888" value="0x02B84000" />
+        <register type="NOA" address="0x00009888" value="0x04B84000" />
+        <register type="NOA" address="0x00009888" value="0x06B84000" />
+        <register type="NOA" address="0x00009888" value="0x08B84000" />
+        <register type="NOA" address="0x00009888" value="0x0AB84000" />
+        <register type="NOA" address="0x00009888" value="0x00B9A000" />
+        <register type="NOA" address="0x00009888" value="0x06B98000" />
+        <register type="NOA" address="0x00009888" value="0x08B9A000" />
+        <register type="NOA" address="0x00009888" value="0x0AB9A000" />
+        <register type="NOA" address="0x00009888" value="0x0CB9A000" />
+        <register type="NOA" address="0x00009888" value="0x0EB9A000" />
+        <register type="NOA" address="0x00009888" value="0x02B9A000" />
+        <register type="NOA" address="0x00009888" value="0x04B9A000" />
+        <register type="NOA" address="0x00009888" value="0x01888000" />
+        <register type="NOA" address="0x00009888" value="0x0D88F800" />
+        <register type="NOA" address="0x00009888" value="0x0F88000F" />
+        <register type="NOA" address="0x00009888" value="0x03888000" />
+        <register type="NOA" address="0x00009888" value="0x05888000" />
+        <register type="NOA" address="0x00009888" value="0x07888000" />
+        <register type="NOA" address="0x00009888" value="0x09888000" />
+        <register type="NOA" address="0x00009888" value="0x0B888000" />
+        <register type="NOA" address="0x00009888" value="0x238B5540" />
+        <register type="NOA" address="0x00009888" value="0x258BAAA2" />
+        <register type="NOA" address="0x00009888" value="0x278B002A" />
+        <register type="NOA" address="0x00009888" value="0x018C4000" />
+        <register type="NOA" address="0x00009888" value="0x0F8C4000" />
+        <register type="NOA" address="0x00009888" value="0x178C2000" />
+        <register type="NOA" address="0x00009888" value="0x198C5500" />
+        <register type="NOA" address="0x00009888" value="0x1B8C0015" />
+        <register type="NOA" address="0x00009888" value="0x038C4000" />
+        <register type="NOA" address="0x00009888" value="0x058C4000" />
+        <register type="NOA" address="0x00009888" value="0x078C4000" />
+        <register type="NOA" address="0x00009888" value="0x098C4000" />
+        <register type="NOA" address="0x00009888" value="0x0B8C4000" />
+        <register type="NOA" address="0x00009888" value="0x018DA000" />
+        <register type="NOA" address="0x00009888" value="0x078D8000" />
+        <register type="NOA" address="0x00009888" value="0x098DA000" />
+        <register type="NOA" address="0x00009888" value="0x0B8DA000" />
+        <register type="NOA" address="0x00009888" value="0x0D8DA000" />
+        <register type="NOA" address="0x00009888" value="0x0F8DA000" />
+        <register type="NOA" address="0x00009888" value="0x038DA000" />
+        <register type="NOA" address="0x00009888" value="0x058DA000" />
+        <register type="NOA" address="0x00009888" value="0x1F85AA80" />
+        <register type="NOA" address="0x00009888" value="0x2185AAA2" />
+        <register type="NOA" address="0x00009888" value="0x2385002A" />
+        <register type="NOA" address="0x00009888" value="0x01834000" />
+        <register type="NOA" address="0x00009888" value="0x0F834000" />
+        <register type="NOA" address="0x00009888" value="0x19835400" />
+        <register type="NOA" address="0x00009888" value="0x1B830155" />
+        <register type="NOA" address="0x00009888" value="0x03834000" />
+        <register type="NOA" address="0x00009888" value="0x05834000" />
+        <register type="NOA" address="0x00009888" value="0x07834000" />
+        <register type="NOA" address="0x00009888" value="0x09834000" />
+        <register type="NOA" address="0x00009888" value="0x0B834000" />
+        <register type="NOA" address="0x00009888" value="0x0184C000" />
+        <register type="NOA" address="0x00009888" value="0x07848000" />
+        <register type="NOA" address="0x00009888" value="0x0984C000" />
+        <register type="NOA" address="0x00009888" value="0x0B84C000" />
+        <register type="NOA" address="0x00009888" value="0x0D84C000" />
+        <register type="NOA" address="0x00009888" value="0x0F84C000" />
+        <register type="NOA" address="0x00009888" value="0x0384C000" />
+        <register type="NOA" address="0x00009888" value="0x0584C000" />
+        <register type="NOA" address="0x00009888" value="0x1180C000" />
+        <register type="NOA" address="0x00009888" value="0x17808000" />
+        <register type="NOA" address="0x00009888" value="0x1980C000" />
+        <register type="NOA" address="0x00009888" value="0x1B80C000" />
+        <register type="NOA" address="0x00009888" value="0x1D80C000" />
+        <register type="NOA" address="0x00009888" value="0x1F80C000" />
+        <register type="NOA" address="0x00009888" value="0x1380C000" />
+        <register type="NOA" address="0x00009888" value="0x1580C000" />
+        <register type="NOA" address="0x00000D24" value="0x00000000" />
+        <register type="NOA" address="0x00009888" value="0x4D800000" />
+        <register type="NOA" address="0x00009888" value="0x3D800000" />
+        <register type="NOA" address="0x00009888" value="0x4F800000" />
+        <register type="NOA" address="0x00009888" value="0x43800000" />
+        <register type="NOA" address="0x00009888" value="0x51800000" />
+        <register type="NOA" address="0x00009888" value="0x45800000" />
+        <register type="NOA" address="0x00009888" value="0x53800000" />
+        <register type="NOA" address="0x00009888" value="0x47800420" />
+        <register type="NOA" address="0x00009888" value="0x21800000" />
+        <register type="NOA" address="0x00009888" value="0x31800000" />
+        <register type="NOA" address="0x00009888" value="0x3F800421" />
+        <register type="NOA" address="0x00009888" value="0x41800000" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+    </register_config>
+    <register_config type="NOA"
+                     availability="$SubsliceMask 0x10 AND"
+                     priority="3"
+                     >
+        <register type="NOA" address="0x00009840" value="0x000000A0" />
+        <register type="NOA" address="0x00009888" value="0x10DC00E0" />
+        <register type="NOA" address="0x00009888" value="0x14DB0160" />
+        <register type="NOA" address="0x00009888" value="0x16DB2800" />
+        <register type="NOA" address="0x00009888" value="0x18DB0120" />
+        <register type="NOA" address="0x00009888" value="0x0EDC25C1" />
+        <register type="NOA" address="0x00009888" value="0x00DC6100" />
+        <register type="NOA" address="0x00009888" value="0x02DC204C" />
+        <register type="NOA" address="0x00009888" value="0x06DC8000" />
+        <register type="NOA" address="0x00009888" value="0x08DCC000" />
+        <register type="NOA" address="0x00009888" value="0x0ADCC000" />
+        <register type="NOA" address="0x00009888" value="0x0CDCC000" />
+        <register type="NOA" address="0x00009888" value="0x04DCC000" />
+        <register type="NOA" address="0x00009888" value="0x00DB0011" />
+        <register type="NOA" address="0x00009888" value="0x06DB0900" />
+        <register type="NOA" address="0x00009888" value="0x08DB0A13" />
+        <register type="NOA" address="0x00009888" value="0x0ADB0B15" />
+        <register type="NOA" address="0x00009888" value="0x0CDB2317" />
+        <register type="NOA" address="0x00009888" value="0x04DB21B7" />
+        <register type="NOA" address="0x00009888" value="0x10DB0000" />
+        <register type="NOA" address="0x00009888" value="0x0EDB0000" />
+        <register type="NOA" address="0x00009888" value="0x1ADB0000" />
+        <register type="NOA" address="0x00009888" value="0x0C9FA800" />
+        <register type="NOA" address="0x00009888" value="0x0E9FAA2A" />
+        <register type="NOA" address="0x00009888" value="0x109F02AA" />
+        <register type="NOA" address="0x00009888" value="0x00B84000" />
+        <register type="NOA" address="0x00009888" value="0x0EB84000" />
+        <register type="NOA" address="0x00009888" value="0x16B84000" />
+        <register type="NOA" address="0x00009888" value="0x18B81555" />
+        <register type="NOA" address="0x00009888" value="0x02B84000" />
+        <register type="NOA" address="0x00009888" value="0x04B84000" />
+        <register type="NOA" address="0x00009888" value="0x06B84000" />
+        <register type="NOA" address="0x00009888" value="0x08B84000" />
+        <register type="NOA" address="0x00009888" value="0x0AB84000" />
+        <register type="NOA" address="0x00009888" value="0x00B9A000" />
+        <register type="NOA" address="0x00009888" value="0x06B98000" />
+        <register type="NOA" address="0x00009888" value="0x08B9A000" />
+        <register type="NOA" address="0x00009888" value="0x0AB9A000" />
+        <register type="NOA" address="0x00009888" value="0x0CB9A000" />
+        <register type="NOA" address="0x00009888" value="0x0EB9A000" />
+        <register type="NOA" address="0x00009888" value="0x02B9A000" />
+        <register type="NOA" address="0x00009888" value="0x04B9A000" />
+        <register type="NOA" address="0x00009888" value="0x01888000" />
+        <register type="NOA" address="0x00009888" value="0x0D88F800" />
+        <register type="NOA" address="0x00009888" value="0x0F88000F" />
+        <register type="NOA" address="0x00009888" value="0x03888000" />
+        <register type="NOA" address="0x00009888" value="0x05888000" />
+        <register type="NOA" address="0x00009888" value="0x07888000" />
+        <register type="NOA" address="0x00009888" value="0x09888000" />
+        <register type="NOA" address="0x00009888" value="0x0B888000" />
+        <register type="NOA" address="0x00009888" value="0x238B5540" />
+        <register type="NOA" address="0x00009888" value="0x258BAAA2" />
+        <register type="NOA" address="0x00009888" value="0x278B002A" />
+        <register type="NOA" address="0x00009888" value="0x018C4000" />
+        <register type="NOA" address="0x00009888" value="0x0F8C4000" />
+        <register type="NOA" address="0x00009888" value="0x178C2000" />
+        <register type="NOA" address="0x00009888" value="0x198C5500" />
+        <register type="NOA" address="0x00009888" value="0x1B8C0015" />
+        <register type="NOA" address="0x00009888" value="0x038C4000" />
+        <register type="NOA" address="0x00009888" value="0x058C4000" />
+        <register type="NOA" address="0x00009888" value="0x078C4000" />
+        <register type="NOA" address="0x00009888" value="0x098C4000" />
+        <register type="NOA" address="0x00009888" value="0x0B8C4000" />
+        <register type="NOA" address="0x00009888" value="0x018DA000" />
+        <register type="NOA" address="0x00009888" value="0x078D8000" />
+        <register type="NOA" address="0x00009888" value="0x098DA000" />
+        <register type="NOA" address="0x00009888" value="0x0B8DA000" />
+        <register type="NOA" address="0x00009888" value="0x0D8DA000" />
+        <register type="NOA" address="0x00009888" value="0x0F8DA000" />
+        <register type="NOA" address="0x00009888" value="0x038DA000" />
+        <register type="NOA" address="0x00009888" value="0x058DA000" />
+        <register type="NOA" address="0x00009888" value="0x1F85AA80" />
+        <register type="NOA" address="0x00009888" value="0x2185AAA2" />
+        <register type="NOA" address="0x00009888" value="0x2385002A" />
+        <register type="NOA" address="0x00009888" value="0x01834000" />
+        <register type="NOA" address="0x00009888" value="0x0F834000" />
+        <register type="NOA" address="0x00009888" value="0x19835400" />
+        <register type="NOA" address="0x00009888" value="0x1B830155" />
+        <register type="NOA" address="0x00009888" value="0x03834000" />
+        <register type="NOA" address="0x00009888" value="0x05834000" />
+        <register type="NOA" address="0x00009888" value="0x07834000" />
+        <register type="NOA" address="0x00009888" value="0x09834000" />
+        <register type="NOA" address="0x00009888" value="0x0B834000" />
+        <register type="NOA" address="0x00009888" value="0x0184C000" />
+        <register type="NOA" address="0x00009888" value="0x07848000" />
+        <register type="NOA" address="0x00009888" value="0x0984C000" />
+        <register type="NOA" address="0x00009888" value="0x0B84C000" />
+        <register type="NOA" address="0x00009888" value="0x0D84C000" />
+        <register type="NOA" address="0x00009888" value="0x0F84C000" />
+        <register type="NOA" address="0x00009888" value="0x0384C000" />
+        <register type="NOA" address="0x00009888" value="0x0584C000" />
+        <register type="NOA" address="0x00009888" value="0x1180C000" />
+        <register type="NOA" address="0x00009888" value="0x17808000" />
+        <register type="NOA" address="0x00009888" value="0x1980C000" />
+        <register type="NOA" address="0x00009888" value="0x1B80C000" />
+        <register type="NOA" address="0x00009888" value="0x1D80C000" />
+        <register type="NOA" address="0x00009888" value="0x1F80C000" />
+        <register type="NOA" address="0x00009888" value="0x1380C000" />
+        <register type="NOA" address="0x00009888" value="0x1580C000" />
+        <register type="NOA" address="0x00000D24" value="0x00000000" />
+        <register type="NOA" address="0x00009888" value="0x4D800000" />
+        <register type="NOA" address="0x00009888" value="0x3D800000" />
+        <register type="NOA" address="0x00009888" value="0x4F800000" />
+        <register type="NOA" address="0x00009888" value="0x43800000" />
+        <register type="NOA" address="0x00009888" value="0x51800000" />
+        <register type="NOA" address="0x00009888" value="0x45800000" />
+        <register type="NOA" address="0x00009888" value="0x53800000" />
+        <register type="NOA" address="0x00009888" value="0x47800420" />
+        <register type="NOA" address="0x00009888" value="0x21800000" />
+        <register type="NOA" address="0x00009888" value="0x31800000" />
+        <register type="NOA" address="0x00009888" value="0x3F800421" />
+        <register type="NOA" address="0x00009888" value="0x41800000" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+    </register_config>
+    <register_config type="NOA"
+                     availability="$SubsliceMask 0x20 AND"
+                     priority="5"
+                     >
+        <register type="NOA" address="0x00009840" value="0x000000A0" />
+        <register type="NOA" address="0x00009888" value="0x10B800E0" />
+        <register type="NOA" address="0x00009888" value="0x14BA0160" />
+        <register type="NOA" address="0x00009888" value="0x16BA2800" />
+        <register type="NOA" address="0x00009888" value="0x18BA0120" />
+        <register type="NOA" address="0x00009888" value="0x0C9FA800" />
+        <register type="NOA" address="0x00009888" value="0x0E9FAA2A" />
+        <register type="NOA" address="0x00009888" value="0x109F02AA" />
+        <register type="NOA" address="0x00009888" value="0x0EB8A5C1" />
+        <register type="NOA" address="0x00009888" value="0x00B8A100" />
+        <register type="NOA" address="0x00009888" value="0x02B8204C" />
+        <register type="NOA" address="0x00009888" value="0x16B88000" />
+        <register type="NOA" address="0x00009888" value="0x18B802AA" />
+        <register type="NOA" address="0x00009888" value="0x04B80000" />
+        <register type="NOA" address="0x00009888" value="0x06B80000" />
+        <register type="NOA" address="0x00009888" value="0x08B88000" />
+        <register type="NOA" address="0x00009888" value="0x0AB88000" />
+        <register type="NOA" address="0x00009888" value="0x00B9A000" />
+        <register type="NOA" address="0x00009888" value="0x06B98000" />
+        <register type="NOA" address="0x00009888" value="0x08B9A000" />
+        <register type="NOA" address="0x00009888" value="0x0AB9A000" />
+        <register type="NOA" address="0x00009888" value="0x0CB9A000" />
+        <register type="NOA" address="0x00009888" value="0x0EB9A000" />
+        <register type="NOA" address="0x00009888" value="0x02B9A000" />
+        <register type="NOA" address="0x00009888" value="0x04B9A000" />
+        <register type="NOA" address="0x00009888" value="0x00BA0011" />
+        <register type="NOA" address="0x00009888" value="0x06BA0900" />
+        <register type="NOA" address="0x00009888" value="0x08BA0A13" />
+        <register type="NOA" address="0x00009888" value="0x0ABA0B15" />
+        <register type="NOA" address="0x00009888" value="0x0CBA2317" />
+        <register type="NOA" address="0x00009888" value="0x04BA21B7" />
+        <register type="NOA" address="0x00009888" value="0x10BA0000" />
+        <register type="NOA" address="0x00009888" value="0x0EBA0000" />
+        <register type="NOA" address="0x00009888" value="0x1ABA0000" />
+        <register type="NOA" address="0x00009888" value="0x01888000" />
+        <register type="NOA" address="0x00009888" value="0x0D88F800" />
+        <register type="NOA" address="0x00009888" value="0x0F88000F" />
+        <register type="NOA" address="0x00009888" value="0x03888000" />
+        <register type="NOA" address="0x00009888" value="0x05888000" />
+        <register type="NOA" address="0x00009888" value="0x07888000" />
+        <register type="NOA" address="0x00009888" value="0x09888000" />
+        <register type="NOA" address="0x00009888" value="0x0B888000" />
+        <register type="NOA" address="0x00009888" value="0x238B5540" />
+        <register type="NOA" address="0x00009888" value="0x258BAAA2" />
+        <register type="NOA" address="0x00009888" value="0x278B002A" />
+        <register type="NOA" address="0x00009888" value="0x018C4000" />
+        <register type="NOA" address="0x00009888" value="0x0F8C4000" />
+        <register type="NOA" address="0x00009888" value="0x178C2000" />
+        <register type="NOA" address="0x00009888" value="0x198C5500" />
+        <register type="NOA" address="0x00009888" value="0x1B8C0015" />
+        <register type="NOA" address="0x00009888" value="0x038C4000" />
+        <register type="NOA" address="0x00009888" value="0x058C4000" />
+        <register type="NOA" address="0x00009888" value="0x078C4000" />
+        <register type="NOA" address="0x00009888" value="0x098C4000" />
+        <register type="NOA" address="0x00009888" value="0x0B8C4000" />
+        <register type="NOA" address="0x00009888" value="0x018DA000" />
+        <register type="NOA" address="0x00009888" value="0x078D8000" />
+        <register type="NOA" address="0x00009888" value="0x098DA000" />
+        <register type="NOA" address="0x00009888" value="0x0B8DA000" />
+        <register type="NOA" address="0x00009888" value="0x0D8DA000" />
+        <register type="NOA" address="0x00009888" value="0x0F8DA000" />
+        <register type="NOA" address="0x00009888" value="0x038DA000" />
+        <register type="NOA" address="0x00009888" value="0x058DA000" />
+        <register type="NOA" address="0x00009888" value="0x1F85AA80" />
+        <register type="NOA" address="0x00009888" value="0x2185AAA2" />
+        <register type="NOA" address="0x00009888" value="0x2385002A" />
+        <register type="NOA" address="0x00009888" value="0x01834000" />
+        <register type="NOA" address="0x00009888" value="0x0F834000" />
+        <register type="NOA" address="0x00009888" value="0x19835400" />
+        <register type="NOA" address="0x00009888" value="0x1B830155" />
+        <register type="NOA" address="0x00009888" value="0x03834000" />
+        <register type="NOA" address="0x00009888" value="0x05834000" />
+        <register type="NOA" address="0x00009888" value="0x07834000" />
+        <register type="NOA" address="0x00009888" value="0x09834000" />
+        <register type="NOA" address="0x00009888" value="0x0B834000" />
+        <register type="NOA" address="0x00009888" value="0x0184C000" />
+        <register type="NOA" address="0x00009888" value="0x07848000" />
+        <register type="NOA" address="0x00009888" value="0x0984C000" />
+        <register type="NOA" address="0x00009888" value="0x0B84C000" />
+        <register type="NOA" address="0x00009888" value="0x0D84C000" />
+        <register type="NOA" address="0x00009888" value="0x0F84C000" />
+        <register type="NOA" address="0x00009888" value="0x0384C000" />
+        <register type="NOA" address="0x00009888" value="0x0584C000" />
+        <register type="NOA" address="0x00009888" value="0x1180C000" />
+        <register type="NOA" address="0x00009888" value="0x17808000" />
+        <register type="NOA" address="0x00009888" value="0x1980C000" />
+        <register type="NOA" address="0x00009888" value="0x1B80C000" />
+        <register type="NOA" address="0x00009888" value="0x1D80C000" />
+        <register type="NOA" address="0x00009888" value="0x1F80C000" />
+        <register type="NOA" address="0x00009888" value="0x1380C000" />
+        <register type="NOA" address="0x00009888" value="0x1580C000" />
+        <register type="NOA" address="0x00000D24" value="0x00000000" />
+        <register type="NOA" address="0x00009888" value="0x4D800000" />
+        <register type="NOA" address="0x00009888" value="0x3D800000" />
+        <register type="NOA" address="0x00009888" value="0x4F800000" />
+        <register type="NOA" address="0x00009888" value="0x43800000" />
+        <register type="NOA" address="0x00009888" value="0x51800000" />
+        <register type="NOA" address="0x00009888" value="0x45800000" />
+        <register type="NOA" address="0x00009888" value="0x53800000" />
+        <register type="NOA" address="0x00009888" value="0x47800420" />
+        <register type="NOA" address="0x00009888" value="0x21800000" />
+        <register type="NOA" address="0x00009888" value="0x31800000" />
+        <register type="NOA" address="0x00009888" value="0x3F800421" />
+        <register type="NOA" address="0x00009888" value="0x41800000" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002724" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002770" value="0x0007FC2A" />
+        <register type="OA" address="0x00002774" value="0x0000BF00" />
+        <register type="OA" address="0x00002778" value="0x0007FC6A" />
+        <register type="OA" address="0x0000277C" value="0x0000BF00" />
+        <register type="OA" address="0x00002780" value="0x0007FC92" />
+        <register type="OA" address="0x00002784" value="0x0000BF00" />
+        <register type="OA" address="0x00002788" value="0x0007FCA2" />
+        <register type="OA" address="0x0000278C" value="0x0000BF00" />
+        <register type="OA" address="0x00002790" value="0x0007FC32" />
+        <register type="OA" address="0x00002794" value="0x0000BF00" />
+        <register type="OA" address="0x00002798" value="0x0007FC9A" />
+        <register type="OA" address="0x0000279C" value="0x0000BF00" />
+        <register type="OA" address="0x000027A0" value="0x0007FE6A" />
+        <register type="OA" address="0x000027A4" value="0x0000BF00" />
+        <register type="OA" address="0x000027A8" value="0x0007FE7A" />
+        <register type="OA" address="0x000027AC" value="0x0000BF00" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00000003" />
+        <register type="FLEX" address="0x0000E658" value="0x00002001" />
+        <register type="FLEX" address="0x0000E758" value="0x00778008" />
+        <register type="FLEX" address="0x0000E45C" value="0x00088078" />
+        <register type="FLEX" address="0x0000E55C" value="0x00808708" />
+        <register type="FLEX" address="0x0000E65C" value="0x00A08908" />
+    </register_config>
+  </set>
+
+  <set name="Compute Metrics L3 Cache Gen8"
+       mdapi_supported_apis="VK OGL4 OCL IO BB"
+       underscore_name="compute_l3_cache"
+       hw_config_guid="27a364dc-8225-4ecb-b607-d6f1925598d9"
+       chipset="BDW"
+       symbol_name="ComputeL3Cache"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Bank 03 Accesses"
+             description="The total number of accesses to L3 Bank 03."
+             data_type="uint64"
+             equation="B 3 READ 2 UMUL"
+             underscore_name="l3_bank03_accesses"
+             units="messages"
+             symbol_name="L3Bank03Accesses"
+             availability="$SliceMask 0x01 AND"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="slice"
+             mdapi_group="L3"
+             />
+    <counter name="L3 Accesses"
+             description="The total number of L3 accesses from all entities."
+             data_type="uint64"
+             equation="C 0 READ C 1 READ B 2 READ B 3 READ C 2 READ C 3 READ B 6 READ B 7 READ UADD UADD UADD UADD UADD UADD UADD 2 UMUL"
+             underscore_name="l3_accesses"
+             units="messages"
+             symbol_name="L3Accesses"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Total Throughput"
+             description="The total number of GPU memory bytes transferred via L3."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="$L3Accesses 64 UMUL"
+             underscore_name="l3_total_throughput"
+             units="bytes"
+             symbol_name="L3TotalThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="fpu0_active"
+             units="percent"
+             symbol_name="Fpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OCL OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="fpu1_active"
+             units="percent"
+             symbol_name="Fpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OCL OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU AVG IPC Rate"
+             description="The average rate of IPC calculated for 2 FPU pipelines."
+             data_type="float"
+             max_equation="2"
+             equation="A 9 READ  A 10 READ  A 11 READ UADD  A 9 READ USUB FDIV 1 FADD"
+             underscore_name="eu_avg_ipc_rate"
+             units="number"
+             symbol_name="EuAvgIpcRate"
+             semantic_type="ratio"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier4 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU0 Binary Instruction"
+             description="The percentage of time in which execution units were actively processing binary instructions on FPU0."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_binary_fpu0_instruction"
+             units="percent"
+             symbol_name="EuBinaryFpu0Instruction"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes/Instructions"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="EU FPU0 Hybrid Instruction"
+             description="The percentage of time in which execution units were actively processing hybrid instructions on FPU0."
+             data_type="float"
+             max_equation="100"
+             equation="A 13 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_hybrid_fpu0_instruction"
+             units="percent"
+             symbol_name="EuHybridFpu0Instruction"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="EU Array/Pipes/Instructions"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Misses"
+             description="The total number of L3 misses."
+             data_type="uint64"
+             equation="C 4 READ C 5 READ UADD"
+             underscore_name="l3_misses"
+             units="messages"
+             symbol_name="L3Misses"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/TAG"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="L3 Bank 00 Accesses"
+             description="The total number of accesses to L3 Bank 00."
+             data_type="uint64"
+             equation="C 0 READ 2 UMUL"
+             underscore_name="l3_bank00_accesses"
+             units="messages"
+             symbol_name="L3Bank00Accesses"
+             availability="$SliceMask 0x01 AND"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="slice"
+             mdapi_group="L3"
+             />
+    <counter name="EU FPU0 Move Instruction"
+             description="The percentage of time in which execution units were actively processing move instructions on FPU0."
+             data_type="float"
+             max_equation="100"
+             equation="A 19 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_move_fpu0_instruction"
+             units="percent"
+             symbol_name="EuMoveFpu0Instruction"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes/Instructions"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="L3 Bank 10 Accesses"
+             description="The total number of accesses to L3 Bank 10."
+             data_type="uint64"
+             equation="C 2 READ 2 UMUL"
+             underscore_name="l3_bank10_accesses"
+             units="messages"
+             symbol_name="L3Bank10Accesses"
+             availability="$SliceMask 0x02 AND"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="slice"
+             mdapi_group="L3"
+             />
+    <counter name="EU FPU1 Hybrid Instruction"
+             description="The percentage of time in which execution units were actively processing hybrid instructions on FPU1."
+             data_type="float"
+             max_equation="100"
+             equation="A 14 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_hybrid_fpu1_instruction"
+             units="percent"
+             symbol_name="EuHybridFpu1Instruction"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="EU Array/Pipes/Instructions"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Bank 10 IC Accesses"
+             description="The total number of accesses to L3 Bank 10 from IC cache."
+             data_type="uint64"
+             equation="B 4 READ B 5 READ UADD 2 UMUL $L3Bank10Accesses UMIN"
+             underscore_name="l3_bank10_ic_accesses"
+             units="messages"
+             symbol_name="L3Bank10IcAccesses"
+             availability="$SliceMask 0x02 AND"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="slice"
+             mdapi_group="L3/IC"
+             />
+    <counter name="L3 Bank 10 IC Hits"
+             description="The total number of hits in L3 Bank 10 from IC cache."
+             data_type="uint64"
+             equation="B 5 READ 2 UMUL $L3Bank10IcAccesses UMIN"
+             underscore_name="l3_bank10_ic_hits"
+             units="messages"
+             symbol_name="L3Bank10IcHits"
+             availability="$SliceMask 0x02 AND"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="slice"
+             mdapi_group="L3/IC"
+             />
+    <counter name="GTI Read Throughput"
+             description="The total number of GPU memory bytes read from GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL"
+             equation="C 6 READ 64 UMUL"
+             underscore_name="gti_read_throughput"
+             units="bytes"
+             symbol_name="GtiReadThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GTI L3 Throughput"
+             description="The total number of GPU memory bytes transferred between L3 caches and GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="C 4 READ C 5 READ UADD 64 UMUL"
+             underscore_name="gti_l3_throughput"
+             units="bytes"
+             symbol_name="GtiL3Throughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Bank 00 IC Accesses"
+             description="The total number of accesses to L3 Bank 00 from IC cache."
+             data_type="uint64"
+             equation="B 0 READ B 1 READ UADD 2 UMUL $L3Bank00Accesses UMIN"
+             underscore_name="l3_bank00_ic_accesses"
+             units="messages"
+             symbol_name="L3Bank00IcAccesses"
+             availability="$SliceMask 0x01 AND"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="slice"
+             mdapi_group="L3/IC"
+             />
+    <counter name="L3 Bank 00 IC Hits"
+             description="The total number of hits in L3 Bank 00 from IC cache."
+             data_type="uint64"
+             equation="B 1 READ 2 UMUL $L3Bank00IcAccesses UMIN"
+             underscore_name="l3_bank00_ic_hits"
+             units="messages"
+             symbol_name="L3Bank00IcHits"
+             availability="$SliceMask 0x01 AND"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="slice"
+             mdapi_group="L3/IC"
+             />
+    <counter name="L3 Bank 01 Accesses"
+             description="The total number of accesses to L3 Bank 01."
+             data_type="uint64"
+             equation="C 1 READ 2 UMUL"
+             underscore_name="l3_bank01_accesses"
+             units="messages"
+             symbol_name="L3Bank01Accesses"
+             availability="$SliceMask 0x01 AND"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="slice"
+             mdapi_group="L3"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU0 Ternary Instruction"
+             description="The percentage of time in which execution units were actively processing ternary instructions on FPU0."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_ternary_fpu0_instruction"
+             units="percent"
+             symbol_name="EuTernaryFpu0Instruction"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes/Instructions"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU FPU1 Move Instruction"
+             description="The percentage of time in which execution units were actively processing move instructions on FPU1."
+             data_type="float"
+             max_equation="100"
+             equation="A 20 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_move_fpu1_instruction"
+             units="percent"
+             symbol_name="EuMoveFpu1Instruction"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes/Instructions"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="L3 Bank 11 Accesses"
+             description="The total number of accesses to L3 Bank 11."
+             data_type="uint64"
+             equation="C 3 READ 2 UMUL"
+             underscore_name="l3_bank11_accesses"
+             units="messages"
+             symbol_name="L3Bank11Accesses"
+             availability="$SliceMask 0x02 AND"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="slice"
+             mdapi_group="L3"
+             />
+    <counter name="L3 Bank 02 Accesses"
+             description="The total number of accesses to L3 Bank 02."
+             data_type="uint64"
+             equation="B 2 READ 2 UMUL"
+             underscore_name="l3_bank02_accesses"
+             units="messages"
+             symbol_name="L3Bank02Accesses"
+             availability="$SliceMask 0x01 AND"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="slice"
+             mdapi_group="L3"
+             />
+    <counter name="L3 Bank 13 Accesses"
+             description="The total number of accesses to L3 Bank 13."
+             data_type="uint64"
+             equation="B 7 READ 2 UMUL"
+             underscore_name="l3_bank13_accesses"
+             units="messages"
+             symbol_name="L3Bank13Accesses"
+             availability="$SliceMask 0x02 AND"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="slice"
+             mdapi_group="L3"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="GTI Write Throughput"
+             description="The total number of GPU memory bytes written to GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 32 UMUL"
+             equation="C 7 READ 64 UMUL"
+             underscore_name="gti_write_throughput"
+             units="bytes"
+             symbol_name="GtiWriteThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL 2 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses UADD UADD 64 UMUL"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="L3 Bank 12 Accesses"
+             description="The total number of accesses to L3 Bank 12."
+             data_type="uint64"
+             equation="B 6 READ 2 UMUL"
+             underscore_name="l3_bank12_accesses"
+             units="messages"
+             symbol_name="L3Bank12Accesses"
+             availability="$SliceMask 0x02 AND"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="slice"
+             mdapi_group="L3"
+             />
+    <counter name="EU FPU1 Binary Instruction"
+             description="The percentage of time in which execution units were actively processing binary instructions on FPU1."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_binary_fpu1_instruction"
+             units="percent"
+             symbol_name="EuBinaryFpu1Instruction"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes/Instructions"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU1 Ternary Instruction"
+             description="The percentage of time in which execution units were actively processing ternary instructions on FPU1."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_ternary_fpu1_instruction"
+             units="percent"
+             symbol_name="EuTernaryFpu1Instruction"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes/Instructions"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_send_active"
+             units="percent"
+             symbol_name="EuSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x000000A0" />
+        <register type="NOA" address="0x00009888" value="0x143F00B3" />
+        <register type="NOA" address="0x00009888" value="0x14BF00B3" />
+        <register type="NOA" address="0x00009888" value="0x138303C0" />
+        <register type="NOA" address="0x00009888" value="0x3B800060" />
+        <register type="NOA" address="0x00009888" value="0x3D800805" />
+        <register type="NOA" address="0x00009888" value="0x003F0029" />
+        <register type="NOA" address="0x00009888" value="0x063F1400" />
+        <register type="NOA" address="0x00009888" value="0x083F1225" />
+        <register type="NOA" address="0x00009888" value="0x0E3F1327" />
+        <register type="NOA" address="0x00009888" value="0x103F0000" />
+        <register type="NOA" address="0x00009888" value="0x005A4000" />
+        <register type="NOA" address="0x00009888" value="0x065A8000" />
+        <register type="NOA" address="0x00009888" value="0x085AC000" />
+        <register type="NOA" address="0x00009888" value="0x0E5AC000" />
+        <register type="NOA" address="0x00009888" value="0x001D4000" />
+        <register type="NOA" address="0x00009888" value="0x061D8000" />
+        <register type="NOA" address="0x00009888" value="0x081DC000" />
+        <register type="NOA" address="0x00009888" value="0x0E1DC000" />
+        <register type="NOA" address="0x00009888" value="0x0C1F0800" />
+        <register type="NOA" address="0x00009888" value="0x0E1F2A00" />
+        <register type="NOA" address="0x00009888" value="0x101F0280" />
+        <register type="NOA" address="0x00009888" value="0x00391000" />
+        <register type="NOA" address="0x00009888" value="0x06394000" />
+        <register type="NOA" address="0x00009888" value="0x08395000" />
+        <register type="NOA" address="0x00009888" value="0x0E395000" />
+        <register type="NOA" address="0x00009888" value="0x0ABF1429" />
+        <register type="NOA" address="0x00009888" value="0x0CBF1225" />
+        <register type="NOA" address="0x00009888" value="0x00BF1380" />
+        <register type="NOA" address="0x00009888" value="0x02BF0026" />
+        <register type="NOA" address="0x00009888" value="0x10BF0000" />
+        <register type="NOA" address="0x00009888" value="0x0ADAC000" />
+        <register type="NOA" address="0x00009888" value="0x0CDAC000" />
+        <register type="NOA" address="0x00009888" value="0x00DA8000" />
+        <register type="NOA" address="0x00009888" value="0x02DA4000" />
+        <register type="NOA" address="0x00009888" value="0x0A9DC000" />
+        <register type="NOA" address="0x00009888" value="0x0C9DC000" />
+        <register type="NOA" address="0x00009888" value="0x009D8000" />
+        <register type="NOA" address="0x00009888" value="0x029D4000" />
+        <register type="NOA" address="0x00009888" value="0x0E9F8000" />
+        <register type="NOA" address="0x00009888" value="0x109F002A" />
+        <register type="NOA" address="0x00009888" value="0x0C9FA000" />
+        <register type="NOA" address="0x00009888" value="0x0AB95000" />
+        <register type="NOA" address="0x00009888" value="0x0CB95000" />
+        <register type="NOA" address="0x00009888" value="0x00B94000" />
+        <register type="NOA" address="0x00009888" value="0x02B91000" />
+        <register type="NOA" address="0x00009888" value="0x0D88C000" />
+        <register type="NOA" address="0x00009888" value="0x0F880003" />
+        <register type="NOA" address="0x00009888" value="0x03888000" />
+        <register type="NOA" address="0x00009888" value="0x05888000" />
+        <register type="NOA" address="0x00009888" value="0x018A8000" />
+        <register type="NOA" address="0x00009888" value="0x0F8A8000" />
+        <register type="NOA" address="0x00009888" value="0x198A8000" />
+        <register type="NOA" address="0x00009888" value="0x1B8A8020" />
+        <register type="NOA" address="0x00009888" value="0x1D8A0002" />
+        <register type="NOA" address="0x00009888" value="0x238B0520" />
+        <register type="NOA" address="0x00009888" value="0x258BA950" />
+        <register type="NOA" address="0x00009888" value="0x278B0016" />
+        <register type="NOA" address="0x00009888" value="0x198C5400" />
+        <register type="NOA" address="0x00009888" value="0x1B8C0001" />
+        <register type="NOA" address="0x00009888" value="0x038C4000" />
+        <register type="NOA" address="0x00009888" value="0x058C4000" />
+        <register type="NOA" address="0x00009888" value="0x0B8DA000" />
+        <register type="NOA" address="0x00009888" value="0x0D8DA000" />
+        <register type="NOA" address="0x00009888" value="0x018D8000" />
+        <register type="NOA" address="0x00009888" value="0x038D2000" />
+        <register type="NOA" address="0x00009888" value="0x1F85AA80" />
+        <register type="NOA" address="0x00009888" value="0x2185AAA0" />
+        <register type="NOA" address="0x00009888" value="0x2385002A" />
+        <register type="NOA" address="0x00009888" value="0x03835180" />
+        <register type="NOA" address="0x00009888" value="0x05834022" />
+        <register type="NOA" address="0x00009888" value="0x11830000" />
+        <register type="NOA" address="0x00009888" value="0x01834000" />
+        <register type="NOA" address="0x00009888" value="0x0F834000" />
+        <register type="NOA" address="0x00009888" value="0x19835400" />
+        <register type="NOA" address="0x00009888" value="0x1B830155" />
+        <register type="NOA" address="0x00009888" value="0x07830000" />
+        <register type="NOA" address="0x00009888" value="0x09830000" />
+        <register type="NOA" address="0x00009888" value="0x0184C000" />
+        <register type="NOA" address="0x00009888" value="0x07848000" />
+        <register type="NOA" address="0x00009888" value="0x0984C000" />
+        <register type="NOA" address="0x00009888" value="0x0B84C000" />
+        <register type="NOA" address="0x00009888" value="0x0D84C000" />
+        <register type="NOA" address="0x00009888" value="0x0F84C000" />
+        <register type="NOA" address="0x00009888" value="0x0384C000" />
+        <register type="NOA" address="0x00009888" value="0x05844000" />
+        <register type="NOA" address="0x00009888" value="0x1B80C137" />
+        <register type="NOA" address="0x00009888" value="0x1D80C147" />
+        <register type="NOA" address="0x00009888" value="0x21800000" />
+        <register type="NOA" address="0x00009888" value="0x1180C000" />
+        <register type="NOA" address="0x00009888" value="0x17808000" />
+        <register type="NOA" address="0x00009888" value="0x1980C000" />
+        <register type="NOA" address="0x00009888" value="0x1F80C000" />
+        <register type="NOA" address="0x00009888" value="0x1380C000" />
+        <register type="NOA" address="0x00009888" value="0x15804000" />
+        <register type="NOA" address="0x00000D24" value="0x00000000" />
+        <register type="NOA" address="0x00009888" value="0x4D801000" />
+        <register type="NOA" address="0x00009888" value="0x4F800111" />
+        <register type="NOA" address="0x00009888" value="0x43800842" />
+        <register type="NOA" address="0x00009888" value="0x51800000" />
+        <register type="NOA" address="0x00009888" value="0x45800000" />
+        <register type="NOA" address="0x00009888" value="0x53800000" />
+        <register type="NOA" address="0x00009888" value="0x47800840" />
+        <register type="NOA" address="0x00009888" value="0x31800000" />
+        <register type="NOA" address="0x00009888" value="0x3F800800" />
+        <register type="NOA" address="0x00009888" value="0x418014A2" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x30800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x30800000" />
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002770" value="0x0007FFFA" />
+        <register type="OA" address="0x00002774" value="0x0000FEFE" />
+        <register type="OA" address="0x00002778" value="0x0007FFFA" />
+        <register type="OA" address="0x0000277C" value="0x0000FEFD" />
+        <register type="OA" address="0x00002790" value="0x0007FFFA" />
+        <register type="OA" address="0x00002794" value="0x0000FBEF" />
+        <register type="OA" address="0x00002798" value="0x0007FFFA" />
+        <register type="OA" address="0x0000279C" value="0x0000FBDF" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00000003" />
+        <register type="FLEX" address="0x0000E658" value="0x00002001" />
+        <register type="FLEX" address="0x0000E758" value="0x00101100" />
+        <register type="FLEX" address="0x0000E45C" value="0x00201200" />
+        <register type="FLEX" address="0x0000E55C" value="0x00301300" />
+        <register type="FLEX" address="0x0000E65C" value="0x00401400" />
+    </register_config>
+  </set>
+
+  <set name="Data Port Reads Coalescing Gen8"
+       mdapi_supported_apis="VK OGL4 OCL IO BB"
+       underscore_name="data_port_reads_coalescing"
+       hw_config_guid="857fc630-2f09-4804-85f1-084adfadd5ab"
+       chipset="BDW"
+       symbol_name="DataPortReadsCoalescing"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="fpu0_active"
+             units="percent"
+             symbol_name="Fpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="fpu1_active"
+             units="percent"
+             symbol_name="Fpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU AVG IPC Rate"
+             description="The average rate of IPC calculated for 2 FPU pipelines."
+             data_type="float"
+             max_equation="2"
+             equation="A 9 READ  A 10 READ  A 11 READ UADD  A 9 READ USUB FDIV 1 FADD"
+             underscore_name="eu_avg_ipc_rate"
+             units="number"
+             symbol_name="EuAvgIpcRate"
+             semantic_type="ratio"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texel lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU to Data Port 0 Reads 64"
+             description="The subslice 0 EU data reads from Data Port with 64B per message."
+             data_type="uint64"
+             equation="B 5 READ"
+             underscore_name="eu_hdc0_reads64_b"
+             units="messages"
+             symbol_name="EuHdc0Reads64B"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="Data Port 0 to L3 Data Reads"
+             description="The subslice 0 Data Port data and constant reads from L3 cache."
+             data_type="uint64"
+             equation="C 4 READ"
+             underscore_name="hdc0_l3_data_reads"
+             units="messages"
+             symbol_name="Hdc0L3DataReads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="Data Port 0 to L3 Data Writes"
+             description="The subslice 0 Data Port data writes to L3 cache."
+             data_type="uint64"
+             equation="C 5 READ"
+             underscore_name="hdc0_l3_data_writes"
+             units="messages"
+             symbol_name="Hdc0L3DataWrites"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="EU to Data Port 0 Reads 128"
+             description="The subslice 0 EU data reads from Data Port with 128B per message."
+             data_type="uint64"
+             equation="B 6 READ"
+             underscore_name="eu_hdc0_reads128_b"
+             units="messages"
+             symbol_name="EuHdc0Reads128B"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="EU Thread Occupancy"
+             description="The percentage of time in which hardware threads occupied EUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 13 READ 8 UMUL $EuCoresTotalCount UDIV $EuThreadsCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_thread_occupancy"
+             units="percent"
+             symbol_name="EuThreadOccupancy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="All Data Port 0 Writes to L3"
+             description="The subslice 0 Data Port writes to L3 cache."
+             data_type="uint64"
+             equation="C 2 READ"
+             underscore_name="hdc0_l3_writes"
+             units="messages"
+             symbol_name="Hdc0L3Writes"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU to Data Port 0 Reads 32"
+             description="The subslice 0 EU data reads from Data Port with 32B per message."
+             data_type="uint64"
+             equation="B 4 READ"
+             underscore_name="eu_hdc0_reads32_b"
+             units="messages"
+             symbol_name="EuHdc0Reads32B"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="EU to Data Port 0 Reads 256"
+             description="The subslice 0 EU data reads from Data Port with 256B per message."
+             data_type="uint64"
+             equation="B 7 READ"
+             underscore_name="eu_hdc0_reads256_b"
+             units="messages"
+             symbol_name="EuHdc0Reads256B"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="EuBytesReadPerCacheLine"
+             description="Average EU bytes read per L3 cache line."
+             data_type="float"
+             equation="$EuHdc0Reads32B 32 UMUL $EuHdc0Reads64B 64 UMUL $EuHdc0Reads128B 128 UMUL $EuHdc0Reads256B 256 UMUL UADD UADD UADD $Hdc0L3DataReads FDIV"
+             underscore_name="eu_bytes_read_per_cache_line"
+             units="eu bytes per l3 cache line"
+             symbol_name="EuBytesReadPerCacheLine"
+             semantic_type="ratio"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="EuDataReadsPerCacheLine"
+             description="Coalescing ratio of EU read requests to L3 cache lines."
+             data_type="float"
+             equation="$EuBytesReadPerCacheLine 64 FDIV"
+             underscore_name="eu_data_reads_per_cache_line"
+             units="utilization"
+             symbol_name="EuDataReadsPerCacheLine"
+             semantic_type="ratio"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL 2 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses UADD UADD 64 UMUL"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="All Data Port 0 Reads from L3"
+             description="The subslice 0 Data Port reads from L3 cache."
+             data_type="uint64"
+             equation="C 3 READ C 2 READ USUB"
+             underscore_name="hdc0_l3_reads"
+             units="messages"
+             symbol_name="Hdc0L3Reads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <counter name="EU Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_send_active"
+             units="percent"
+             symbol_name="EuSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <register_config type="NOA"
+                     availability="$SubsliceMask 0x01 AND"
+                     priority="0"
+                     >
+        <register type="NOA" address="0x00009840" value="0x000000A0" />
+        <register type="NOA" address="0x00009888" value="0x103D0005" />
+        <register type="NOA" address="0x00009888" value="0x163D240B" />
+        <register type="NOA" address="0x00009888" value="0x1058022F" />
+        <register type="NOA" address="0x00009888" value="0x185B5520" />
+        <register type="NOA" address="0x00009888" value="0x198B0003" />
+        <register type="NOA" address="0x00009888" value="0x005CC000" />
+        <register type="NOA" address="0x00009888" value="0x065CC000" />
+        <register type="NOA" address="0x00009888" value="0x085CC000" />
+        <register type="NOA" address="0x00009888" value="0x0A5CC000" />
+        <register type="NOA" address="0x00009888" value="0x0C5CC000" />
+        <register type="NOA" address="0x00009888" value="0x0E5CC000" />
+        <register type="NOA" address="0x00009888" value="0x025C4000" />
+        <register type="NOA" address="0x00009888" value="0x045C8000" />
+        <register type="NOA" address="0x00009888" value="0x003D0000" />
+        <register type="NOA" address="0x00009888" value="0x063D00B0" />
+        <register type="NOA" address="0x00009888" value="0x083D0182" />
+        <register type="NOA" address="0x00009888" value="0x0A3D10A0" />
+        <register type="NOA" address="0x00009888" value="0x0C3D11A2" />
+        <register type="NOA" address="0x00009888" value="0x0E3D0000" />
+        <register type="NOA" address="0x00009888" value="0x183D0000" />
+        <register type="NOA" address="0x00009888" value="0x1A3D0000" />
+        <register type="NOA" address="0x00009888" value="0x0E582242" />
+        <register type="NOA" address="0x00009888" value="0x00586700" />
+        <register type="NOA" address="0x00009888" value="0x0258004F" />
+        <register type="NOA" address="0x00009888" value="0x0658C000" />
+        <register type="NOA" address="0x00009888" value="0x0858C000" />
+        <register type="NOA" address="0x00009888" value="0x0A58C000" />
+        <register type="NOA" address="0x00009888" value="0x0C58C000" />
+        <register type="NOA" address="0x00009888" value="0x045B6300" />
+        <register type="NOA" address="0x00009888" value="0x105B0000" />
+        <register type="NOA" address="0x00009888" value="0x005B4000" />
+        <register type="NOA" address="0x00009888" value="0x0E5B4000" />
+        <register type="NOA" address="0x00009888" value="0x1A5B0155" />
+        <register type="NOA" address="0x00009888" value="0x025B4000" />
+        <register type="NOA" address="0x00009888" value="0x0A5B0000" />
+        <register type="NOA" address="0x00009888" value="0x0C5B4000" />
+        <register type="NOA" address="0x00009888" value="0x0C1FA800" />
+        <register type="NOA" address="0x00009888" value="0x0E1FAAA0" />
+        <register type="NOA" address="0x00009888" value="0x101F02AA" />
+        <register type="NOA" address="0x00009888" value="0x00384000" />
+        <register type="NOA" address="0x00009888" value="0x0E384000" />
+        <register type="NOA" address="0x00009888" value="0x16384000" />
+        <register type="NOA" address="0x00009888" value="0x18381555" />
+        <register type="NOA" address="0x00009888" value="0x02384000" />
+        <register type="NOA" address="0x00009888" value="0x04384000" />
+        <register type="NOA" address="0x00009888" value="0x0A384000" />
+        <register type="NOA" address="0x00009888" value="0x0C384000" />
+        <register type="NOA" address="0x00009888" value="0x0039A000" />
+        <register type="NOA" address="0x00009888" value="0x0639A000" />
+        <register type="NOA" address="0x00009888" value="0x0839A000" />
+        <register type="NOA" address="0x00009888" value="0x0A39A000" />
+        <register type="NOA" address="0x00009888" value="0x0C39A000" />
+        <register type="NOA" address="0x00009888" value="0x0E39A000" />
+        <register type="NOA" address="0x00009888" value="0x02392000" />
+        <register type="NOA" address="0x00009888" value="0x04398000" />
+        <register type="NOA" address="0x00009888" value="0x018A8000" />
+        <register type="NOA" address="0x00009888" value="0x0F8A8000" />
+        <register type="NOA" address="0x00009888" value="0x198A8000" />
+        <register type="NOA" address="0x00009888" value="0x1B8AAAA0" />
+        <register type="NOA" address="0x00009888" value="0x1D8A0002" />
+        <register type="NOA" address="0x00009888" value="0x038A8000" />
+        <register type="NOA" address="0x00009888" value="0x058A8000" />
+        <register type="NOA" address="0x00009888" value="0x0B8A8000" />
+        <register type="NOA" address="0x00009888" value="0x0D8A8000" />
+        <register type="NOA" address="0x00009888" value="0x038B6300" />
+        <register type="NOA" address="0x00009888" value="0x058B0062" />
+        <register type="NOA" address="0x00009888" value="0x118B0000" />
+        <register type="NOA" address="0x00009888" value="0x238B02A0" />
+        <register type="NOA" address="0x00009888" value="0x258B5555" />
+        <register type="NOA" address="0x00009888" value="0x278B0015" />
+        <register type="NOA" address="0x00009888" value="0x1F85AA80" />
+        <register type="NOA" address="0x00009888" value="0x2185AAAA" />
+        <register type="NOA" address="0x00009888" value="0x2385002A" />
+        <register type="NOA" address="0x00009888" value="0x01834000" />
+        <register type="NOA" address="0x00009888" value="0x0F834000" />
+        <register type="NOA" address="0x00009888" value="0x19835400" />
+        <register type="NOA" address="0x00009888" value="0x1B830155" />
+        <register type="NOA" address="0x00009888" value="0x03834000" />
+        <register type="NOA" address="0x00009888" value="0x05834000" />
+        <register type="NOA" address="0x00009888" value="0x07834000" />
+        <register type="NOA" address="0x00009888" value="0x09834000" />
+        <register type="NOA" address="0x00009888" value="0x0B834000" />
+        <register type="NOA" address="0x00009888" value="0x0D834000" />
+        <register type="NOA" address="0x00009888" value="0x0184C000" />
+        <register type="NOA" address="0x00009888" value="0x0784C000" />
+        <register type="NOA" address="0x00009888" value="0x0984C000" />
+        <register type="NOA" address="0x00009888" value="0x0B84C000" />
+        <register type="NOA" address="0x00009888" value="0x0D84C000" />
+        <register type="NOA" address="0x00009888" value="0x0F84C000" />
+        <register type="NOA" address="0x00009888" value="0x0384C000" />
+        <register type="NOA" address="0x00009888" value="0x0584C000" />
+        <register type="NOA" address="0x00009888" value="0x1180C000" />
+        <register type="NOA" address="0x00009888" value="0x1780C000" />
+        <register type="NOA" address="0x00009888" value="0x1980C000" />
+        <register type="NOA" address="0x00009888" value="0x1B80C000" />
+        <register type="NOA" address="0x00009888" value="0x1D80C000" />
+        <register type="NOA" address="0x00009888" value="0x1F80C000" />
+        <register type="NOA" address="0x00009888" value="0x1380C000" />
+        <register type="NOA" address="0x00009888" value="0x1580C000" />
+        <register type="NOA" address="0x00000D24" value="0x00000000" />
+        <register type="NOA" address="0x00009888" value="0x4D801000" />
+        <register type="NOA" address="0x00009888" value="0x3D800000" />
+        <register type="NOA" address="0x00009888" value="0x4F800001" />
+        <register type="NOA" address="0x00009888" value="0x43800000" />
+        <register type="NOA" address="0x00009888" value="0x51800000" />
+        <register type="NOA" address="0x00009888" value="0x45800000" />
+        <register type="NOA" address="0x00009888" value="0x53800000" />
+        <register type="NOA" address="0x00009888" value="0x47800420" />
+        <register type="NOA" address="0x00009888" value="0x21800000" />
+        <register type="NOA" address="0x00009888" value="0x31800000" />
+        <register type="NOA" address="0x00009888" value="0x3F800421" />
+        <register type="NOA" address="0x00009888" value="0x41800041" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002724" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x0000274C" value="0xBA98BA98" />
+        <register type="OA" address="0x00002748" value="0xBA98BA98" />
+        <register type="OA" address="0x00002744" value="0x00003377" />
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002770" value="0x0007FFF2" />
+        <register type="OA" address="0x00002774" value="0x00007FF0" />
+        <register type="OA" address="0x00002778" value="0x0007FFE2" />
+        <register type="OA" address="0x0000277C" value="0x00007FF0" />
+        <register type="OA" address="0x00002780" value="0x0007FFC2" />
+        <register type="OA" address="0x00002784" value="0x00007FF0" />
+        <register type="OA" address="0x00002788" value="0x0007FF82" />
+        <register type="OA" address="0x0000278C" value="0x00007FF0" />
+        <register type="OA" address="0x00002790" value="0x0007FFFA" />
+        <register type="OA" address="0x00002794" value="0x0000BFEF" />
+        <register type="OA" address="0x00002798" value="0x0007FFFA" />
+        <register type="OA" address="0x0000279C" value="0x0000BFDF" />
+        <register type="OA" address="0x000027A0" value="0x0007FFFA" />
+        <register type="OA" address="0x000027A4" value="0x0000BFBF" />
+        <register type="OA" address="0x000027A8" value="0x0007FFFA" />
+        <register type="OA" address="0x000027AC" value="0x0000BF7F" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00000003" />
+        <register type="FLEX" address="0x0000E658" value="0x00002001" />
+        <register type="FLEX" address="0x0000E758" value="0x00778008" />
+        <register type="FLEX" address="0x0000E45C" value="0x00088078" />
+        <register type="FLEX" address="0x0000E55C" value="0x00808708" />
+        <register type="FLEX" address="0x0000E65C" value="0x00A08908" />
+    </register_config>
+  </set>
+
+  <set name="Data Port Writes Coalescing Gen8"
+       mdapi_supported_apis="VK OGL4 OCL IO BB"
+       underscore_name="data_port_writes_coalescing"
+       hw_config_guid="343ebc99-4a55-414c-8c17-d8e259cf5e20"
+       chipset="BDW"
+       symbol_name="DataPortWritesCoalescing"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU to Data Port 0 Writes 192B"
+             description="The subslice 0 EU data simd16 writes to Data Port with 192B per message."
+             data_type="uint64"
+             equation="B 6 READ 2 UDIV"
+             underscore_name="eu_hdc0_writes192_b"
+             units="messages"
+             symbol_name="EuHdc0Writes192B"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="fpu0_active"
+             units="percent"
+             symbol_name="Fpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="fpu1_active"
+             units="percent"
+             symbol_name="Fpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU AVG IPC Rate"
+             description="The average rate of IPC calculated for 2 FPU pipelines."
+             data_type="float"
+             max_equation="2"
+             equation="A 9 READ  A 10 READ  A 11 READ UADD  A 9 READ USUB FDIV 1 FADD"
+             underscore_name="eu_avg_ipc_rate"
+             units="number"
+             symbol_name="EuAvgIpcRate"
+             semantic_type="ratio"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="EU to Data Port 0 Writes 32B"
+             description="The subslice 0 EU data writes to Data Port with 32B per message."
+             data_type="uint64"
+             equation="B 0 READ"
+             underscore_name="eu_hdc0_writes32_b"
+             units="messages"
+             symbol_name="EuHdc0Writes32B"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texel Misses"
+             description="The total number of texel lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU to Data Port 0 Writes 256B"
+             description="The subslice 0 EU data simd16 writes to Data Port with 256B per message."
+             data_type="uint64"
+             equation="B 7 READ 2 UDIV"
+             underscore_name="eu_hdc0_writes256_b_simd16"
+             units="messages"
+             symbol_name="EuHdc0Writes256BSimd16"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="Data Port 0 to L3 Data Reads"
+             description="The subslice 0 Data Port data and constant reads from L3 cache."
+             data_type="uint64"
+             equation="C 4 READ"
+             underscore_name="hdc0_l3_data_reads"
+             units="messages"
+             symbol_name="Hdc0L3DataReads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="Data Port 0 to L3 Data Writes"
+             description="The subslice 0 Data Port data writes to L3 cache."
+             data_type="uint64"
+             equation="C 5 READ"
+             underscore_name="hdc0_l3_data_writes"
+             units="messages"
+             symbol_name="Hdc0L3DataWrites"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="EU to Data Port 0 Writes 128B SIMD16"
+             description="The subslice 0 EU data simd16 writes to Data Port with 128B per message."
+             data_type="uint64"
+             equation="B 5 READ"
+             underscore_name="eu_hdc0_writes128_b_simd16"
+             units="messages"
+             symbol_name="EuHdc0Writes128BSimd16"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="EU to Data Port 0 Writes 96B"
+             description="The subslice 0 EU data writes to Data Port with 96B per message."
+             data_type="uint64"
+             equation="B 2 READ 2 UDIV"
+             underscore_name="eu_hdc0_writes96_b"
+             units="messages"
+             symbol_name="EuHdc0Writes96B"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="EU Thread Occupancy"
+             description="The percentage of time in which hardware threads occupied EUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 13 READ 8 UMUL $EuCoresTotalCount UDIV $EuThreadsCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_thread_occupancy"
+             units="percent"
+             symbol_name="EuThreadOccupancy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="All Data Port 0 Writes to L3"
+             description="The subslice 0 Data Port writes to L3 cache."
+             data_type="uint64"
+             equation="C 2 READ"
+             underscore_name="hdc0_l3_writes"
+             units="messages"
+             symbol_name="Hdc0L3Writes"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU to Data Port 0 Writes 64B"
+             description="The subslice 0 EU data writes to Data Port with 64B per message."
+             data_type="uint64"
+             equation="B 1 READ B 4 READ UADD"
+             underscore_name="eu_hdc0_writes64_b"
+             units="messages"
+             symbol_name="EuHdc0Writes64B"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="EU to Data Port 0 Writes 128B"
+             description="The subslice 0 EU data writes to Data Port with 128B per message."
+             data_type="uint64"
+             equation="B 3 READ 2 UDIV"
+             underscore_name="eu_hdc0_writes128_b"
+             units="messages"
+             symbol_name="EuHdc0Writes128B"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="EuBytesWrittenPerCacheLine"
+             description="Average EU bytes written per L3 cache line."
+             data_type="float"
+             equation="$EuHdc0Writes32B 32 UMUL $EuHdc0Writes64B 64 UMUL $EuHdc0Writes96B 96 UMUL $EuHdc0Writes128B 128 UMUL $EuHdc0Writes128BSimd16 128 UMUL $EuHdc0Writes256BSimd16 256 UMUL $EuHdc0Writes192B 192 UMUL UADD UADD UADD UADD UADD UADD $Hdc0L3DataWrites FDIV"
+             underscore_name="eu_bytes_written_per_cache_line"
+             units="eu bytes per l3 cache line"
+             symbol_name="EuBytesWrittenPerCacheLine"
+             semantic_type="ratio"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="EuDataWritesPerCacheLine"
+             description="Coalescing ratio of EU write requests to L3 cache lines."
+             data_type="float"
+             equation="$EuBytesWrittenPerCacheLine 64 FDIV"
+             underscore_name="eu_data_writes_per_cache_line"
+             units="utilization"
+             symbol_name="EuDataWritesPerCacheLine"
+             semantic_type="ratio"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL 2 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses UADD UADD 64 UMUL"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="All Data Port 0 Reads from L3"
+             description="The subslice 0 Data Port reads from L3 cache."
+             data_type="uint64"
+             equation="C 3 READ C 2 READ USUB"
+             underscore_name="hdc0_l3_reads"
+             units="messages"
+             symbol_name="Hdc0L3Reads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <counter name="EU Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_send_active"
+             units="percent"
+             symbol_name="EuSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <register_config type="NOA"
+                     availability="$SubsliceMask 0x01 AND"
+                     priority="0"
+                     >
+        <register type="NOA" address="0x00009840" value="0x000000A0" />
+        <register type="NOA" address="0x00009888" value="0x103D0005" />
+        <register type="NOA" address="0x00009888" value="0x143D0120" />
+        <register type="NOA" address="0x00009888" value="0x163D2400" />
+        <register type="NOA" address="0x00009888" value="0x1058022F" />
+        <register type="NOA" address="0x00009888" value="0x105B0000" />
+        <register type="NOA" address="0x00009888" value="0x198B0003" />
+        <register type="NOA" address="0x00009888" value="0x005CC000" />
+        <register type="NOA" address="0x00009888" value="0x065CC000" />
+        <register type="NOA" address="0x00009888" value="0x085CC000" />
+        <register type="NOA" address="0x00009888" value="0x0A5CC000" />
+        <register type="NOA" address="0x00009888" value="0x0E5CC000" />
+        <register type="NOA" address="0x00009888" value="0x025C4000" />
+        <register type="NOA" address="0x00009888" value="0x045C8000" />
+        <register type="NOA" address="0x00009888" value="0x003D0000" />
+        <register type="NOA" address="0x00009888" value="0x063D0094" />
+        <register type="NOA" address="0x00009888" value="0x083D0182" />
+        <register type="NOA" address="0x00009888" value="0x0A3D1814" />
+        <register type="NOA" address="0x00009888" value="0x0E3D0000" />
+        <register type="NOA" address="0x00009888" value="0x183D0000" />
+        <register type="NOA" address="0x00009888" value="0x1A3D0000" />
+        <register type="NOA" address="0x00009888" value="0x0C3D0000" />
+        <register type="NOA" address="0x00009888" value="0x0E582242" />
+        <register type="NOA" address="0x00009888" value="0x00586700" />
+        <register type="NOA" address="0x00009888" value="0x0258004F" />
+        <register type="NOA" address="0x00009888" value="0x0658C000" />
+        <register type="NOA" address="0x00009888" value="0x0858C000" />
+        <register type="NOA" address="0x00009888" value="0x0A58C000" />
+        <register type="NOA" address="0x00009888" value="0x045B6A80" />
+        <register type="NOA" address="0x00009888" value="0x005B4000" />
+        <register type="NOA" address="0x00009888" value="0x0E5B4000" />
+        <register type="NOA" address="0x00009888" value="0x185B5400" />
+        <register type="NOA" address="0x00009888" value="0x1A5B0141" />
+        <register type="NOA" address="0x00009888" value="0x025B4000" />
+        <register type="NOA" address="0x00009888" value="0x0A5B0000" />
+        <register type="NOA" address="0x00009888" value="0x0C5B4000" />
+        <register type="NOA" address="0x00009888" value="0x0C1FA800" />
+        <register type="NOA" address="0x00009888" value="0x0E1FAAA0" />
+        <register type="NOA" address="0x00009888" value="0x101F0282" />
+        <register type="NOA" address="0x00009888" value="0x00384000" />
+        <register type="NOA" address="0x00009888" value="0x0E384000" />
+        <register type="NOA" address="0x00009888" value="0x16384000" />
+        <register type="NOA" address="0x00009888" value="0x18381415" />
+        <register type="NOA" address="0x00009888" value="0x02384000" />
+        <register type="NOA" address="0x00009888" value="0x04384000" />
+        <register type="NOA" address="0x00009888" value="0x0A384000" />
+        <register type="NOA" address="0x00009888" value="0x0C384000" />
+        <register type="NOA" address="0x00009888" value="0x0039A000" />
+        <register type="NOA" address="0x00009888" value="0x0639A000" />
+        <register type="NOA" address="0x00009888" value="0x0839A000" />
+        <register type="NOA" address="0x00009888" value="0x0A39A000" />
+        <register type="NOA" address="0x00009888" value="0x0E39A000" />
+        <register type="NOA" address="0x00009888" value="0x02392000" />
+        <register type="NOA" address="0x00009888" value="0x04398000" />
+        <register type="NOA" address="0x00009888" value="0x018A8000" />
+        <register type="NOA" address="0x00009888" value="0x0F8A8000" />
+        <register type="NOA" address="0x00009888" value="0x198A8000" />
+        <register type="NOA" address="0x00009888" value="0x1B8A82A0" />
+        <register type="NOA" address="0x00009888" value="0x1D8A0002" />
+        <register type="NOA" address="0x00009888" value="0x038A8000" />
+        <register type="NOA" address="0x00009888" value="0x058A8000" />
+        <register type="NOA" address="0x00009888" value="0x0B8A8000" />
+        <register type="NOA" address="0x00009888" value="0x0D8A8000" />
+        <register type="NOA" address="0x00009888" value="0x038B6300" />
+        <register type="NOA" address="0x00009888" value="0x058B0062" />
+        <register type="NOA" address="0x00009888" value="0x118B0000" />
+        <register type="NOA" address="0x00009888" value="0x238B02A0" />
+        <register type="NOA" address="0x00009888" value="0x258B1555" />
+        <register type="NOA" address="0x00009888" value="0x278B0014" />
+        <register type="NOA" address="0x00009888" value="0x1F85AA80" />
+        <register type="NOA" address="0x00009888" value="0x21852AAA" />
+        <register type="NOA" address="0x00009888" value="0x23850028" />
+        <register type="NOA" address="0x00009888" value="0x01834000" />
+        <register type="NOA" address="0x00009888" value="0x0F834000" />
+        <register type="NOA" address="0x00009888" value="0x19835400" />
+        <register type="NOA" address="0x00009888" value="0x1B830141" />
+        <register type="NOA" address="0x00009888" value="0x03834000" />
+        <register type="NOA" address="0x00009888" value="0x05834000" />
+        <register type="NOA" address="0x00009888" value="0x07834000" />
+        <register type="NOA" address="0x00009888" value="0x09834000" />
+        <register type="NOA" address="0x00009888" value="0x0B834000" />
+        <register type="NOA" address="0x00009888" value="0x0D834000" />
+        <register type="NOA" address="0x00009888" value="0x0184C000" />
+        <register type="NOA" address="0x00009888" value="0x0784C000" />
+        <register type="NOA" address="0x00009888" value="0x0984C000" />
+        <register type="NOA" address="0x00009888" value="0x0B84C000" />
+        <register type="NOA" address="0x00009888" value="0x0F84C000" />
+        <register type="NOA" address="0x00009888" value="0x0384C000" />
+        <register type="NOA" address="0x00009888" value="0x0584C000" />
+        <register type="NOA" address="0x00009888" value="0x1180C000" />
+        <register type="NOA" address="0x00009888" value="0x1780C000" />
+        <register type="NOA" address="0x00009888" value="0x1980C000" />
+        <register type="NOA" address="0x00009888" value="0x1B80C000" />
+        <register type="NOA" address="0x00009888" value="0x1F80C000" />
+        <register type="NOA" address="0x00009888" value="0x1380C000" />
+        <register type="NOA" address="0x00009888" value="0x1580C000" />
+        <register type="NOA" address="0x00000D24" value="0x00000000" />
+        <register type="NOA" address="0x00009888" value="0x4D801000" />
+        <register type="NOA" address="0x00009888" value="0x3D800000" />
+        <register type="NOA" address="0x00009888" value="0x4F800001" />
+        <register type="NOA" address="0x00009888" value="0x43800000" />
+        <register type="NOA" address="0x00009888" value="0x51800000" />
+        <register type="NOA" address="0x00009888" value="0x45800000" />
+        <register type="NOA" address="0x00009888" value="0x21800000" />
+        <register type="NOA" address="0x00009888" value="0x31800000" />
+        <register type="NOA" address="0x00009888" value="0x53800000" />
+        <register type="NOA" address="0x00009888" value="0x47800420" />
+        <register type="NOA" address="0x00009888" value="0x3F800421" />
+        <register type="NOA" address="0x00009888" value="0x41800041" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002724" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x0000274C" value="0xBA98BA98" />
+        <register type="OA" address="0x00002748" value="0xBA98BA98" />
+        <register type="OA" address="0x00002744" value="0x00003377" />
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002770" value="0x0007FF72" />
+        <register type="OA" address="0x00002774" value="0x0000BFD0" />
+        <register type="OA" address="0x00002778" value="0x0007FF62" />
+        <register type="OA" address="0x0000277C" value="0x0000BFD0" />
+        <register type="OA" address="0x00002780" value="0x0007FF42" />
+        <register type="OA" address="0x00002784" value="0x0000BFD0" />
+        <register type="OA" address="0x00002788" value="0x0007FF02" />
+        <register type="OA" address="0x0000278C" value="0x0000BFD0" />
+        <register type="OA" address="0x00002790" value="0x0005FFF2" />
+        <register type="OA" address="0x00002794" value="0x0000BFD0" />
+        <register type="OA" address="0x00002798" value="0x0005FFE2" />
+        <register type="OA" address="0x0000279C" value="0x0000BFD0" />
+        <register type="OA" address="0x000027A0" value="0x0005FFC2" />
+        <register type="OA" address="0x000027A4" value="0x0000BFD0" />
+        <register type="OA" address="0x000027A8" value="0x0005FF82" />
+        <register type="OA" address="0x000027AC" value="0x0000BFD0" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00000003" />
+        <register type="FLEX" address="0x0000E658" value="0x00002001" />
+        <register type="FLEX" address="0x0000E758" value="0x00778008" />
+        <register type="FLEX" address="0x0000E45C" value="0x00088078" />
+        <register type="FLEX" address="0x0000E55C" value="0x00808708" />
+        <register type="FLEX" address="0x0000E65C" value="0x00A08908" />
+    </register_config>
+  </set>
+
+  <set name="Metric set HDCAndSF"
+       mdapi_supported_apis="VK OGL OCL IO BB"
+       underscore_name="hdc_and_sf"
+       hw_config_guid="78490af2-10fa-430b-ae3c-94ec04d5214e"
+       chipset="BDW"
+       symbol_name="HDCAndSF"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SQ is full"
+             description="The percentage of time when SQ is filled above a threshold (usually 48 entries)."
+             data_type="float"
+             max_equation="100"
+             equation="PERFCNT1 READ_REG 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gt_request_queue_full"
+             units="percent"
+             symbol_name="GTRequestQueueFull"
+             availability="true $QueryMode &&"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL4 OCL"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="Polygon Data Ready"
+             description="The percentage of time in which geometry pipeline output is ready"
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="poly_data_ready"
+             units="percent"
+             symbol_name="PolyDataReady"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/3D Pipe/Strip-Fans"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="HDC stalled by L3 (s1.ss2)"
+             description="Percentage of time when HDC has messages to L3, but it's stalled due to lack of credits (s1.ss2)"
+             data_type="float"
+             max_equation="100"
+             equation="C 1 READ C 0 READ USUB 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="non_sampler_shader12_access_stalled_on_l3"
+             units="percent"
+             symbol_name="NonSamplerShader12AccessStalledOnL3"
+             availability="$SubsliceMask 0x20 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="GPU/Data Port"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texel lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="HDC stalled by L3 (s0.ss1)"
+             description="Percentage of time when HDC has messages to L3, but it's stalled due to lack of credits (s0.ss1)"
+             data_type="float"
+             max_equation="100"
+             equation="C 5 READ C 4 READ USUB 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="non_sampler_shader01_access_stalled_on_l3"
+             units="percent"
+             symbol_name="NonSamplerShader01AccessStalledOnL3"
+             availability="$SubsliceMask 0x2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="GPU/Data Port"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="HDC stalled by L3 (s0.ss2)"
+             description="Percentage of time when HDC has messages to L3, but it's stalled due to lack of credits (s0.ss2)"
+             data_type="float"
+             max_equation="100"
+             equation="C 7 READ C 6 READ USUB 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="non_sampler_shader02_access_stalled_on_l3"
+             units="percent"
+             symbol_name="NonSamplerShader02AccessStalledOnL3"
+             availability="$SubsliceMask 0x4 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="GPU/Data Port"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="HDC stalled by L3 (s1.ss0)"
+             description="Percentage of time when HDC has messages to L3, but it's stalled due to lack of credits (s1.ss0)"
+             data_type="float"
+             max_equation="100"
+             equation="B 5 READ B 4 READ USUB 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="non_sampler_shader10_access_stalled_on_l3"
+             units="percent"
+             symbol_name="NonSamplerShader10AccessStalledOnL3"
+             availability="$SubsliceMask 0x8 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="GPU/Data Port"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="HDC stalled by L3 (s1.ss1)"
+             description="Percentage of time when HDC has messages to L3, but it's stalled due to lack of credits (s1.ss1)"
+             data_type="float"
+             max_equation="100"
+             equation="B 7 READ B 6 READ USUB 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="non_sampler_shader11_access_stalled_on_l3"
+             units="percent"
+             symbol_name="NonSamplerShader11AccessStalledOnL3"
+             availability="$SubsliceMask 0x10 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="GPU/Data Port"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL 2 UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="HDC stalled by L3 (s0.ss0)"
+             description="Percentage of time when HDC has messages to L3, but it's stalled due to lack of credits (s0.ss0)"
+             data_type="float"
+             max_equation="100"
+             equation="C 3 READ C 2 READ USUB 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="non_sampler_shader00_access_stalled_on_l3"
+             units="percent"
+             symbol_name="NonSamplerShader00AccessStalledOnL3"
+             availability="$SubsliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="GPU/Data Port"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x000000A0" />
+        <register type="NOA" address="0x00009888" value="0x105C0232" />
+        <register type="NOA" address="0x00009888" value="0x10580232" />
+        <register type="NOA" address="0x00009888" value="0x10380232" />
+        <register type="NOA" address="0x00009888" value="0x10DC0232" />
+        <register type="NOA" address="0x00009888" value="0x10D80232" />
+        <register type="NOA" address="0x00009888" value="0x10B80232" />
+        <register type="NOA" address="0x00009888" value="0x118E4400" />
+        <register type="NOA" address="0x00009888" value="0x025C6080" />
+        <register type="NOA" address="0x00009888" value="0x045C004B" />
+        <register type="NOA" address="0x00009888" value="0x005C8000" />
+        <register type="NOA" address="0x00009888" value="0x00582080" />
+        <register type="NOA" address="0x00009888" value="0x0258004B" />
+        <register type="NOA" address="0x00009888" value="0x025B4000" />
+        <register type="NOA" address="0x00009888" value="0x045B4000" />
+        <register type="NOA" address="0x00009888" value="0x0C1FA000" />
+        <register type="NOA" address="0x00009888" value="0x0E1F00AA" />
+        <register type="NOA" address="0x00009888" value="0x04386080" />
+        <register type="NOA" address="0x00009888" value="0x0638404B" />
+        <register type="NOA" address="0x00009888" value="0x02384000" />
+        <register type="NOA" address="0x00009888" value="0x08384000" />
+        <register type="NOA" address="0x00009888" value="0x0A380000" />
+        <register type="NOA" address="0x00009888" value="0x0C380000" />
+        <register type="NOA" address="0x00009888" value="0x00398000" />
+        <register type="NOA" address="0x00009888" value="0x0239A000" />
+        <register type="NOA" address="0x00009888" value="0x0439A000" />
+        <register type="NOA" address="0x00009888" value="0x06392000" />
+        <register type="NOA" address="0x00009888" value="0x0CDC25C1" />
+        <register type="NOA" address="0x00009888" value="0x0ADCC000" />
+        <register type="NOA" address="0x00009888" value="0x0AD825C1" />
+        <register type="NOA" address="0x00009888" value="0x18DB4000" />
+        <register type="NOA" address="0x00009888" value="0x1ADB0001" />
+        <register type="NOA" address="0x00009888" value="0x0E9F8000" />
+        <register type="NOA" address="0x00009888" value="0x109F02AA" />
+        <register type="NOA" address="0x00009888" value="0x0EB825C1" />
+        <register type="NOA" address="0x00009888" value="0x18B80154" />
+        <register type="NOA" address="0x00009888" value="0x0AB9A000" />
+        <register type="NOA" address="0x00009888" value="0x0CB9A000" />
+        <register type="NOA" address="0x00009888" value="0x0EB9A000" />
+        <register type="NOA" address="0x00009888" value="0x0D88C000" />
+        <register type="NOA" address="0x00009888" value="0x0F88000F" />
+        <register type="NOA" address="0x00009888" value="0x038A8000" />
+        <register type="NOA" address="0x00009888" value="0x058A8000" />
+        <register type="NOA" address="0x00009888" value="0x078A8000" />
+        <register type="NOA" address="0x00009888" value="0x098A8000" />
+        <register type="NOA" address="0x00009888" value="0x0B8A8000" />
+        <register type="NOA" address="0x00009888" value="0x0D8A8000" />
+        <register type="NOA" address="0x00009888" value="0x258BAA05" />
+        <register type="NOA" address="0x00009888" value="0x278B002A" />
+        <register type="NOA" address="0x00009888" value="0x238B2A80" />
+        <register type="NOA" address="0x00009888" value="0x198C5400" />
+        <register type="NOA" address="0x00009888" value="0x1B8C0015" />
+        <register type="NOA" address="0x00009888" value="0x098DC000" />
+        <register type="NOA" address="0x00009888" value="0x0B8DA000" />
+        <register type="NOA" address="0x00009888" value="0x0D8DA000" />
+        <register type="NOA" address="0x00009888" value="0x0F8DA000" />
+        <register type="NOA" address="0x00009888" value="0x098E05C0" />
+        <register type="NOA" address="0x00009888" value="0x058E0000" />
+        <register type="NOA" address="0x00009888" value="0x198F0020" />
+        <register type="NOA" address="0x00009888" value="0x2185AA0A" />
+        <register type="NOA" address="0x00009888" value="0x2385002A" />
+        <register type="NOA" address="0x00009888" value="0x1F85AA00" />
+        <register type="NOA" address="0x00009888" value="0x19835000" />
+        <register type="NOA" address="0x00009888" value="0x1B830155" />
+        <register type="NOA" address="0x00009888" value="0x03834000" />
+        <register type="NOA" address="0x00009888" value="0x05834000" />
+        <register type="NOA" address="0x00009888" value="0x07834000" />
+        <register type="NOA" address="0x00009888" value="0x09834000" />
+        <register type="NOA" address="0x00009888" value="0x0B834000" />
+        <register type="NOA" address="0x00009888" value="0x0D834000" />
+        <register type="NOA" address="0x00009888" value="0x09848000" />
+        <register type="NOA" address="0x00009888" value="0x0B84C000" />
+        <register type="NOA" address="0x00009888" value="0x0D84C000" />
+        <register type="NOA" address="0x00009888" value="0x0F84C000" />
+        <register type="NOA" address="0x00009888" value="0x01848000" />
+        <register type="NOA" address="0x00009888" value="0x0384C000" />
+        <register type="NOA" address="0x00009888" value="0x0584C000" />
+        <register type="NOA" address="0x00009888" value="0x07844000" />
+        <register type="NOA" address="0x00009888" value="0x19808000" />
+        <register type="NOA" address="0x00009888" value="0x1B80C000" />
+        <register type="NOA" address="0x00009888" value="0x1D80C000" />
+        <register type="NOA" address="0x00009888" value="0x1F80C000" />
+        <register type="NOA" address="0x00009888" value="0x11808000" />
+        <register type="NOA" address="0x00009888" value="0x1380C000" />
+        <register type="NOA" address="0x00009888" value="0x1580C000" />
+        <register type="NOA" address="0x00009888" value="0x17804000" />
+        <register type="NOA" address="0x00009888" value="0x51800040" />
+        <register type="NOA" address="0x00009888" value="0x43800400" />
+        <register type="NOA" address="0x00009888" value="0x45800800" />
+        <register type="NOA" address="0x00009888" value="0x53800000" />
+        <register type="NOA" address="0x00009888" value="0x47800C62" />
+        <register type="NOA" address="0x00009888" value="0x21800000" />
+        <register type="NOA" address="0x00009888" value="0x31800000" />
+        <register type="NOA" address="0x00009888" value="0x4D800000" />
+        <register type="NOA" address="0x00009888" value="0x3F801042" />
+        <register type="NOA" address="0x00009888" value="0x4F800000" />
+        <register type="NOA" address="0x00009888" value="0x418014A4" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x000091BC" value="0xE0500000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002744" value="0x00800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x10800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+        <register type="OA" address="0x00002770" value="0x00000002" />
+        <register type="OA" address="0x00002774" value="0x0000FFF7" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E758" value="0x00015014" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+        <register type="FLEX" address="0x0000E65C" value="0x00055054" />
+    </register_config>
+  </set>
+
+  <set name="Metric set L3_1"
+       mdapi_supported_apis="VK OGL OCL IO BB"
+       underscore_name="l3_1"
+       hw_config_guid="c0abdd97-3b13-4cad-814c-bd178804e02c"
+       chipset="BDW"
+       symbol_name="L3_1"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice1 L3 Bank1 Stalled"
+             description="The percentage of time in which slice1 L3 bank1 is stalled"
+             data_type="float"
+             max_equation="100"
+             equation="B 4 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l31_bank1_stalled"
+             units="percent"
+             symbol_name="L31Bank1Stalled"
+             availability="$SliceMask 0x2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SQ is full"
+             description="The percentage of time when SQ is filled above a threshold (usually 48 entries)"
+             data_type="float"
+             max_equation="100"
+             equation="PERFCNT1 READ_REG 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gt_request_queue_full"
+             units="percent"
+             symbol_name="GTRequestQueueFull"
+             availability="true $QueryMode &&"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL4 OCL"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on the both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Slice1 L3 Bank0 Stalled"
+             description="The percentage of time in which slice1 L3 bank0 is stalled"
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l31_bank0_stalled"
+             units="percent"
+             symbol_name="L31Bank0Stalled"
+             availability="$SliceMask 0x2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="Slice1 L3 Bank1 Active"
+             description="The percentage of time in which slice1 L3 bank1 is active"
+             data_type="float"
+             max_equation="100"
+             equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l31_bank1_active"
+             units="percent"
+             symbol_name="L31Bank1Active"
+             availability="$SliceMask 0x2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice1 L3 Bank0 Active"
+             description="The percentage of time in which slice1 L3 bank0 is active"
+             data_type="float"
+             max_equation="100"
+             equation="C 6 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l31_bank0_active"
+             units="percent"
+             symbol_name="L31Bank0Active"
+             availability="$SliceMask 0x2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL 2 UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x000000A0" />
+        <register type="NOA" address="0x00009888" value="0x10BF03DA" />
+        <register type="NOA" address="0x00009888" value="0x14BF0001" />
+        <register type="NOA" address="0x00009888" value="0x12980340" />
+        <register type="NOA" address="0x00009888" value="0x12990340" />
+        <register type="NOA" address="0x00009888" value="0x0CBF1187" />
+        <register type="NOA" address="0x00009888" value="0x0EBF1205" />
+        <register type="NOA" address="0x00009888" value="0x00BF0500" />
+        <register type="NOA" address="0x00009888" value="0x02BF042B" />
+        <register type="NOA" address="0x00009888" value="0x04BF002C" />
+        <register type="NOA" address="0x00009888" value="0x0CDAC000" />
+        <register type="NOA" address="0x00009888" value="0x0EDAC000" />
+        <register type="NOA" address="0x00009888" value="0x00DA8000" />
+        <register type="NOA" address="0x00009888" value="0x02DAC000" />
+        <register type="NOA" address="0x00009888" value="0x04DA4000" />
+        <register type="NOA" address="0x00009888" value="0x04983400" />
+        <register type="NOA" address="0x00009888" value="0x10980000" />
+        <register type="NOA" address="0x00009888" value="0x06990034" />
+        <register type="NOA" address="0x00009888" value="0x10990000" />
+        <register type="NOA" address="0x00009888" value="0x0C9DC000" />
+        <register type="NOA" address="0x00009888" value="0x0E9DC000" />
+        <register type="NOA" address="0x00009888" value="0x009D8000" />
+        <register type="NOA" address="0x00009888" value="0x029DC000" />
+        <register type="NOA" address="0x00009888" value="0x049D4000" />
+        <register type="NOA" address="0x00009888" value="0x109F02A8" />
+        <register type="NOA" address="0x00009888" value="0x0C9FA000" />
+        <register type="NOA" address="0x00009888" value="0x0E9F00BA" />
+        <register type="NOA" address="0x00009888" value="0x0CB88000" />
+        <register type="NOA" address="0x00009888" value="0x0CB95000" />
+        <register type="NOA" address="0x00009888" value="0x0EB95000" />
+        <register type="NOA" address="0x00009888" value="0x00B94000" />
+        <register type="NOA" address="0x00009888" value="0x02B95000" />
+        <register type="NOA" address="0x00009888" value="0x04B91000" />
+        <register type="NOA" address="0x00009888" value="0x06B92000" />
+        <register type="NOA" address="0x00009888" value="0x0CBA4000" />
+        <register type="NOA" address="0x00009888" value="0x0F88000F" />
+        <register type="NOA" address="0x00009888" value="0x03888000" />
+        <register type="NOA" address="0x00009888" value="0x05888000" />
+        <register type="NOA" address="0x00009888" value="0x07888000" />
+        <register type="NOA" address="0x00009888" value="0x09888000" />
+        <register type="NOA" address="0x00009888" value="0x0B888000" />
+        <register type="NOA" address="0x00009888" value="0x0D880400" />
+        <register type="NOA" address="0x00009888" value="0x258B800A" />
+        <register type="NOA" address="0x00009888" value="0x278B002A" />
+        <register type="NOA" address="0x00009888" value="0x238B5500" />
+        <register type="NOA" address="0x00009888" value="0x198C4000" />
+        <register type="NOA" address="0x00009888" value="0x1B8C0015" />
+        <register type="NOA" address="0x00009888" value="0x038C4000" />
+        <register type="NOA" address="0x00009888" value="0x058C4000" />
+        <register type="NOA" address="0x00009888" value="0x078C4000" />
+        <register type="NOA" address="0x00009888" value="0x098C4000" />
+        <register type="NOA" address="0x00009888" value="0x0B8C4000" />
+        <register type="NOA" address="0x00009888" value="0x0D8C4000" />
+        <register type="NOA" address="0x00009888" value="0x0D8DA000" />
+        <register type="NOA" address="0x00009888" value="0x0F8DA000" />
+        <register type="NOA" address="0x00009888" value="0x018D8000" />
+        <register type="NOA" address="0x00009888" value="0x038DA000" />
+        <register type="NOA" address="0x00009888" value="0x058DA000" />
+        <register type="NOA" address="0x00009888" value="0x078D2000" />
+        <register type="NOA" address="0x00009888" value="0x2185800A" />
+        <register type="NOA" address="0x00009888" value="0x2385002A" />
+        <register type="NOA" address="0x00009888" value="0x1F85AA00" />
+        <register type="NOA" address="0x00009888" value="0x1B830154" />
+        <register type="NOA" address="0x00009888" value="0x03834000" />
+        <register type="NOA" address="0x00009888" value="0x05834000" />
+        <register type="NOA" address="0x00009888" value="0x07834000" />
+        <register type="NOA" address="0x00009888" value="0x09834000" />
+        <register type="NOA" address="0x00009888" value="0x0B834000" />
+        <register type="NOA" address="0x00009888" value="0x0D834000" />
+        <register type="NOA" address="0x00009888" value="0x0D84C000" />
+        <register type="NOA" address="0x00009888" value="0x0F84C000" />
+        <register type="NOA" address="0x00009888" value="0x01848000" />
+        <register type="NOA" address="0x00009888" value="0x0384C000" />
+        <register type="NOA" address="0x00009888" value="0x0584C000" />
+        <register type="NOA" address="0x00009888" value="0x07844000" />
+        <register type="NOA" address="0x00009888" value="0x1D80C000" />
+        <register type="NOA" address="0x00009888" value="0x1F80C000" />
+        <register type="NOA" address="0x00009888" value="0x11808000" />
+        <register type="NOA" address="0x00009888" value="0x1380C000" />
+        <register type="NOA" address="0x00009888" value="0x1580C000" />
+        <register type="NOA" address="0x00009888" value="0x17804000" />
+        <register type="NOA" address="0x00009888" value="0x53800000" />
+        <register type="NOA" address="0x00009888" value="0x45800000" />
+        <register type="NOA" address="0x00009888" value="0x47800000" />
+        <register type="NOA" address="0x00009888" value="0x21800000" />
+        <register type="NOA" address="0x00009888" value="0x31800000" />
+        <register type="NOA" address="0x00009888" value="0x4D800000" />
+        <register type="NOA" address="0x00009888" value="0x3F800000" />
+        <register type="NOA" address="0x00009888" value="0x4F800000" />
+        <register type="NOA" address="0x00009888" value="0x41800060" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x000091BC" value="0xE0500000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002744" value="0x00800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0xF0800000" />
+        <register type="OA" address="0x00002770" value="0x00100070" />
+        <register type="OA" address="0x00002774" value="0x0000FFF1" />
+        <register type="OA" address="0x00002778" value="0x00014002" />
+        <register type="OA" address="0x0000277C" value="0x0000C3FF" />
+        <register type="OA" address="0x00002780" value="0x00010002" />
+        <register type="OA" address="0x00002784" value="0x0000C7FF" />
+        <register type="OA" address="0x00002788" value="0x00004002" />
+        <register type="OA" address="0x0000278C" value="0x0000D3FF" />
+        <register type="OA" address="0x00002790" value="0x00100700" />
+        <register type="OA" address="0x00002794" value="0x0000FF1F" />
+        <register type="OA" address="0x00002798" value="0x00001402" />
+        <register type="OA" address="0x0000279C" value="0x0000FC3F" />
+        <register type="OA" address="0x000027A0" value="0x00001002" />
+        <register type="OA" address="0x000027A4" value="0x0000FC7F" />
+        <register type="OA" address="0x000027A8" value="0x00000402" />
+        <register type="OA" address="0x000027AC" value="0x0000FD3F" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E758" value="0x00015014" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+        <register type="FLEX" address="0x0000E65C" value="0x00055054" />
+    </register_config>
+  </set>
+
+  <set name="Metric set L3_2"
+       mdapi_supported_apis="VK OGL OCL IO BB"
+       underscore_name="l3_2"
+       hw_config_guid="ad665281-a7cf-483a-bd10-0e07c43f61c7"
+       chipset="BDW"
+       symbol_name="L3_2"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 L3 Bank1 Active"
+             description="The percentage of time in which slice0 L3 bank1 is active"
+             data_type="float"
+             max_equation="100"
+             equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l30_bank1_active"
+             units="percent"
+             symbol_name="L30Bank1Active"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SQ is full"
+             description="The percentage of time when SQ is filled above a threshold (usually 48 entries)"
+             data_type="float"
+             max_equation="100"
+             equation="PERFCNT1 READ_REG 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gt_request_queue_full"
+             units="percent"
+             symbol_name="GTRequestQueueFull"
+             availability="true $QueryMode &amp;&amp;"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL4 OCL"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were actively processed on both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="Slice0 L3 Bank1 Stalled"
+             description="The percentage of time in which slice0 L3 bank1 is stalled"
+             data_type="float"
+             max_equation="100"
+             equation="B 4 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l30_bank1_stalled"
+             units="percent"
+             symbol_name="L30Bank1Stalled"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texel lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 L3 Bank0 Active"
+             description="The percentage of time in which slice0 L3 bank0 is active"
+             data_type="float"
+             max_equation="100"
+             equation="C 6 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l30_bank0_active"
+             units="percent"
+             symbol_name="L30Bank0Active"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 L3 Bank0 Stalled"
+             description="The percentage of time in which slice0 L3 bank0 is stalled"
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l30_bank0_stalled"
+             units="percent"
+             symbol_name="L30Bank0Stalled"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL 2 UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x000000A0" />
+        <register type="NOA" address="0x00009888" value="0x103F03DA" />
+        <register type="NOA" address="0x00009888" value="0x143F0001" />
+        <register type="NOA" address="0x00009888" value="0x12180340" />
+        <register type="NOA" address="0x00009888" value="0x12190340" />
+        <register type="NOA" address="0x00009888" value="0x0C3F1187" />
+        <register type="NOA" address="0x00009888" value="0x0E3F1205" />
+        <register type="NOA" address="0x00009888" value="0x003F0500" />
+        <register type="NOA" address="0x00009888" value="0x023F042B" />
+        <register type="NOA" address="0x00009888" value="0x043F002C" />
+        <register type="NOA" address="0x00009888" value="0x0C5AC000" />
+        <register type="NOA" address="0x00009888" value="0x0E5AC000" />
+        <register type="NOA" address="0x00009888" value="0x005A8000" />
+        <register type="NOA" address="0x00009888" value="0x025AC000" />
+        <register type="NOA" address="0x00009888" value="0x045A4000" />
+        <register type="NOA" address="0x00009888" value="0x04183400" />
+        <register type="NOA" address="0x00009888" value="0x10180000" />
+        <register type="NOA" address="0x00009888" value="0x06190034" />
+        <register type="NOA" address="0x00009888" value="0x10190000" />
+        <register type="NOA" address="0x00009888" value="0x0C1DC000" />
+        <register type="NOA" address="0x00009888" value="0x0E1DC000" />
+        <register type="NOA" address="0x00009888" value="0x001D8000" />
+        <register type="NOA" address="0x00009888" value="0x021DC000" />
+        <register type="NOA" address="0x00009888" value="0x041D4000" />
+        <register type="NOA" address="0x00009888" value="0x101F02A8" />
+        <register type="NOA" address="0x00009888" value="0x0C1FA000" />
+        <register type="NOA" address="0x00009888" value="0x0E1F00BA" />
+        <register type="NOA" address="0x00009888" value="0x0C388000" />
+        <register type="NOA" address="0x00009888" value="0x0C395000" />
+        <register type="NOA" address="0x00009888" value="0x0E395000" />
+        <register type="NOA" address="0x00009888" value="0x00394000" />
+        <register type="NOA" address="0x00009888" value="0x02395000" />
+        <register type="NOA" address="0x00009888" value="0x04391000" />
+        <register type="NOA" address="0x00009888" value="0x06392000" />
+        <register type="NOA" address="0x00009888" value="0x0C3A4000" />
+        <register type="NOA" address="0x00009888" value="0x1B8AA800" />
+        <register type="NOA" address="0x00009888" value="0x1D8A0002" />
+        <register type="NOA" address="0x00009888" value="0x038A8000" />
+        <register type="NOA" address="0x00009888" value="0x058A8000" />
+        <register type="NOA" address="0x00009888" value="0x078A8000" />
+        <register type="NOA" address="0x00009888" value="0x098A8000" />
+        <register type="NOA" address="0x00009888" value="0x0B8A8000" />
+        <register type="NOA" address="0x00009888" value="0x0D8A8000" />
+        <register type="NOA" address="0x00009888" value="0x258B4005" />
+        <register type="NOA" address="0x00009888" value="0x278B0015" />
+        <register type="NOA" address="0x00009888" value="0x238B2A80" />
+        <register type="NOA" address="0x00009888" value="0x2185800A" />
+        <register type="NOA" address="0x00009888" value="0x2385002A" />
+        <register type="NOA" address="0x00009888" value="0x1F85AA00" />
+        <register type="NOA" address="0x00009888" value="0x1B830154" />
+        <register type="NOA" address="0x00009888" value="0x03834000" />
+        <register type="NOA" address="0x00009888" value="0x05834000" />
+        <register type="NOA" address="0x00009888" value="0x07834000" />
+        <register type="NOA" address="0x00009888" value="0x09834000" />
+        <register type="NOA" address="0x00009888" value="0x0B834000" />
+        <register type="NOA" address="0x00009888" value="0x0D834000" />
+        <register type="NOA" address="0x00009888" value="0x0D84C000" />
+        <register type="NOA" address="0x00009888" value="0x0F84C000" />
+        <register type="NOA" address="0x00009888" value="0x01848000" />
+        <register type="NOA" address="0x00009888" value="0x0384C000" />
+        <register type="NOA" address="0x00009888" value="0x0584C000" />
+        <register type="NOA" address="0x00009888" value="0x07844000" />
+        <register type="NOA" address="0x00009888" value="0x1D80C000" />
+        <register type="NOA" address="0x00009888" value="0x1F80C000" />
+        <register type="NOA" address="0x00009888" value="0x11808000" />
+        <register type="NOA" address="0x00009888" value="0x1380C000" />
+        <register type="NOA" address="0x00009888" value="0x1580C000" />
+        <register type="NOA" address="0x00009888" value="0x17804000" />
+        <register type="NOA" address="0x00009888" value="0x53800000" />
+        <register type="NOA" address="0x00009888" value="0x45800000" />
+        <register type="NOA" address="0x00009888" value="0x47800000" />
+        <register type="NOA" address="0x00009888" value="0x21800000" />
+        <register type="NOA" address="0x00009888" value="0x31800000" />
+        <register type="NOA" address="0x00009888" value="0x4D800000" />
+        <register type="NOA" address="0x00009888" value="0x3F800000" />
+        <register type="NOA" address="0x00009888" value="0x4F800000" />
+        <register type="NOA" address="0x00009888" value="0x41800060" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x000091BC" value="0xE0500000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002744" value="0x00800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0xF0800000" />
+        <register type="OA" address="0x00002770" value="0x00100070" />
+        <register type="OA" address="0x00002774" value="0x0000FFF1" />
+        <register type="OA" address="0x00002778" value="0x00014002" />
+        <register type="OA" address="0x0000277C" value="0x0000C3FF" />
+        <register type="OA" address="0x00002780" value="0x00010002" />
+        <register type="OA" address="0x00002784" value="0x0000C7FF" />
+        <register type="OA" address="0x00002788" value="0x00004002" />
+        <register type="OA" address="0x0000278C" value="0x0000D3FF" />
+        <register type="OA" address="0x00002790" value="0x00100700" />
+        <register type="OA" address="0x00002794" value="0x0000FF1F" />
+        <register type="OA" address="0x00002798" value="0x00001402" />
+        <register type="OA" address="0x0000279C" value="0x0000FC3F" />
+        <register type="OA" address="0x000027A0" value="0x00001002" />
+        <register type="OA" address="0x000027A4" value="0x0000FC7F" />
+        <register type="OA" address="0x000027A8" value="0x00000402" />
+        <register type="OA" address="0x000027AC" value="0x0000FD3F" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E758" value="0x00015014" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+        <register type="FLEX" address="0x0000E65C" value="0x00055054" />
+    </register_config>
+  </set>
+
+  <set name="Metric set L3_3"
+       mdapi_supported_apis="VK OGL OCL IO BB"
+       underscore_name="l3_3"
+       hw_config_guid="930a15aa-4300-4fce-a9ba-edb0b9e880be"
+       chipset="BDW"
+       symbol_name="L3_3"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SQ is full"
+             description="The percentage of time when SQ is filled above a threshold (usually 48 entries)"
+             data_type="float"
+             max_equation="100"
+             equation="PERFCNT1 READ_REG 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gt_request_queue_full"
+             units="percent"
+             symbol_name="GTRequestQueueFull"
+             availability="true $QueryMode &&"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL4 OCL"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on the both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Slice0 L3 Bank3 Stalled"
+             description="The percentage of time in which slice0 L3 bank3 is stalled"
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l30_bank3_stalled"
+             units="percent"
+             symbol_name="L30Bank3Stalled"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 L3 Bank3 Active"
+             description="The percentage of time in which slice0 L3 bank3 is active"
+             data_type="float"
+             max_equation="100"
+             equation="C 6 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l30_bank3_active"
+             units="percent"
+             symbol_name="L30Bank3Active"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice1 L3 Bank3 Active"
+             description="The percentage of time in which slice1 L3 bank3 is active"
+             data_type="float"
+             max_equation="100"
+             equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l31_bank3_active"
+             units="percent"
+             symbol_name="L31Bank3Active"
+             availability="$SliceMask 0x2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Slice1 L3 Bank3 Stalled"
+             description="The percentage of time in which slice1 L3 bank3 is stalled"
+             data_type="float"
+             max_equation="100"
+             equation="B 4 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l31_bank3_stalled"
+             units="percent"
+             symbol_name="L31Bank3Stalled"
+             availability="$SliceMask 0x2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL 2 UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x000000A0" />
+        <register type="NOA" address="0x00009888" value="0x121B0340" />
+        <register type="NOA" address="0x00009888" value="0x103F0274" />
+        <register type="NOA" address="0x00009888" value="0x123F0000" />
+        <register type="NOA" address="0x00009888" value="0x129B0340" />
+        <register type="NOA" address="0x00009888" value="0x10BF0274" />
+        <register type="NOA" address="0x00009888" value="0x12BF0000" />
+        <register type="NOA" address="0x00009888" value="0x041B3400" />
+        <register type="NOA" address="0x00009888" value="0x101B0000" />
+        <register type="NOA" address="0x00009888" value="0x045C8000" />
+        <register type="NOA" address="0x00009888" value="0x0A3D4000" />
+        <register type="NOA" address="0x00009888" value="0x003F0080" />
+        <register type="NOA" address="0x00009888" value="0x023F0793" />
+        <register type="NOA" address="0x00009888" value="0x043F0014" />
+        <register type="NOA" address="0x00009888" value="0x04588000" />
+        <register type="NOA" address="0x00009888" value="0x005A8000" />
+        <register type="NOA" address="0x00009888" value="0x025AC000" />
+        <register type="NOA" address="0x00009888" value="0x045A4000" />
+        <register type="NOA" address="0x00009888" value="0x0A5B4000" />
+        <register type="NOA" address="0x00009888" value="0x001D8000" />
+        <register type="NOA" address="0x00009888" value="0x021DC000" />
+        <register type="NOA" address="0x00009888" value="0x041D4000" />
+        <register type="NOA" address="0x00009888" value="0x0C1FA000" />
+        <register type="NOA" address="0x00009888" value="0x0E1F002A" />
+        <register type="NOA" address="0x00009888" value="0x0A384000" />
+        <register type="NOA" address="0x00009888" value="0x00394000" />
+        <register type="NOA" address="0x00009888" value="0x02395000" />
+        <register type="NOA" address="0x00009888" value="0x04399000" />
+        <register type="NOA" address="0x00009888" value="0x069B0034" />
+        <register type="NOA" address="0x00009888" value="0x109B0000" />
+        <register type="NOA" address="0x00009888" value="0x06DC4000" />
+        <register type="NOA" address="0x00009888" value="0x0CBD4000" />
+        <register type="NOA" address="0x00009888" value="0x0CBF0981" />
+        <register type="NOA" address="0x00009888" value="0x0EBF0A0F" />
+        <register type="NOA" address="0x00009888" value="0x06D84000" />
+        <register type="NOA" address="0x00009888" value="0x0CDAC000" />
+        <register type="NOA" address="0x00009888" value="0x0EDAC000" />
+        <register type="NOA" address="0x00009888" value="0x0CDB4000" />
+        <register type="NOA" address="0x00009888" value="0x0C9DC000" />
+        <register type="NOA" address="0x00009888" value="0x0E9DC000" />
+        <register type="NOA" address="0x00009888" value="0x109F02A8" />
+        <register type="NOA" address="0x00009888" value="0x0E9F0080" />
+        <register type="NOA" address="0x00009888" value="0x0CB84000" />
+        <register type="NOA" address="0x00009888" value="0x0CB95000" />
+        <register type="NOA" address="0x00009888" value="0x0EB95000" />
+        <register type="NOA" address="0x00009888" value="0x06B92000" />
+        <register type="NOA" address="0x00009888" value="0x0F88000F" />
+        <register type="NOA" address="0x00009888" value="0x0D880400" />
+        <register type="NOA" address="0x00009888" value="0x038A8000" />
+        <register type="NOA" address="0x00009888" value="0x058A8000" />
+        <register type="NOA" address="0x00009888" value="0x078A8000" />
+        <register type="NOA" address="0x00009888" value="0x098A8000" />
+        <register type="NOA" address="0x00009888" value="0x0B8A8000" />
+        <register type="NOA" address="0x00009888" value="0x258B8009" />
+        <register type="NOA" address="0x00009888" value="0x278B002A" />
+        <register type="NOA" address="0x00009888" value="0x238B2A80" />
+        <register type="NOA" address="0x00009888" value="0x198C4000" />
+        <register type="NOA" address="0x00009888" value="0x1B8C0015" />
+        <register type="NOA" address="0x00009888" value="0x0D8C4000" />
+        <register type="NOA" address="0x00009888" value="0x0D8DA000" />
+        <register type="NOA" address="0x00009888" value="0x0F8DA000" />
+        <register type="NOA" address="0x00009888" value="0x078D2000" />
+        <register type="NOA" address="0x00009888" value="0x2185800A" />
+        <register type="NOA" address="0x00009888" value="0x2385002A" />
+        <register type="NOA" address="0x00009888" value="0x1F85AA00" />
+        <register type="NOA" address="0x00009888" value="0x1B830154" />
+        <register type="NOA" address="0x00009888" value="0x03834000" />
+        <register type="NOA" address="0x00009888" value="0x05834000" />
+        <register type="NOA" address="0x00009888" value="0x07834000" />
+        <register type="NOA" address="0x00009888" value="0x09834000" />
+        <register type="NOA" address="0x00009888" value="0x0B834000" />
+        <register type="NOA" address="0x00009888" value="0x0D834000" />
+        <register type="NOA" address="0x00009888" value="0x0D84C000" />
+        <register type="NOA" address="0x00009888" value="0x0F84C000" />
+        <register type="NOA" address="0x00009888" value="0x01848000" />
+        <register type="NOA" address="0x00009888" value="0x0384C000" />
+        <register type="NOA" address="0x00009888" value="0x0584C000" />
+        <register type="NOA" address="0x00009888" value="0x07844000" />
+        <register type="NOA" address="0x00009888" value="0x1D80C000" />
+        <register type="NOA" address="0x00009888" value="0x1F80C000" />
+        <register type="NOA" address="0x00009888" value="0x11808000" />
+        <register type="NOA" address="0x00009888" value="0x1380C000" />
+        <register type="NOA" address="0x00009888" value="0x1580C000" />
+        <register type="NOA" address="0x00009888" value="0x17804000" />
+        <register type="NOA" address="0x00009888" value="0x53800000" />
+        <register type="NOA" address="0x00009888" value="0x45800C00" />
+        <register type="NOA" address="0x00009888" value="0x47800C63" />
+        <register type="NOA" address="0x00009888" value="0x21800000" />
+        <register type="NOA" address="0x00009888" value="0x31800000" />
+        <register type="NOA" address="0x00009888" value="0x4D800000" />
+        <register type="NOA" address="0x00009888" value="0x3F8014A5" />
+        <register type="NOA" address="0x00009888" value="0x4F800000" />
+        <register type="NOA" address="0x00009888" value="0x41800045" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x000091BC" value="0xE0500000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002744" value="0x00800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0xF0800000" />
+        <register type="OA" address="0x00002770" value="0x00100070" />
+        <register type="OA" address="0x00002774" value="0x0000FFF1" />
+        <register type="OA" address="0x00002778" value="0x00014002" />
+        <register type="OA" address="0x0000277C" value="0x0000C3FF" />
+        <register type="OA" address="0x00002780" value="0x00010002" />
+        <register type="OA" address="0x00002784" value="0x0000C7FF" />
+        <register type="OA" address="0x00002788" value="0x00004002" />
+        <register type="OA" address="0x0000278C" value="0x0000D3FF" />
+        <register type="OA" address="0x00002790" value="0x00100700" />
+        <register type="OA" address="0x00002794" value="0x0000FF1F" />
+        <register type="OA" address="0x00002798" value="0x00001402" />
+        <register type="OA" address="0x0000279C" value="0x0000FC3F" />
+        <register type="OA" address="0x000027A0" value="0x00001002" />
+        <register type="OA" address="0x000027A4" value="0x0000FC7F" />
+        <register type="OA" address="0x000027A8" value="0x00000402" />
+        <register type="OA" address="0x000027AC" value="0x0000FD3F" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E758" value="0x00015014" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+        <register type="FLEX" address="0x0000E65C" value="0x00055054" />
+    </register_config>
+  </set>
+
+  <set name="Metric set L3_4"
+       mdapi_supported_apis="VK OGL OCL IO BB"
+       underscore_name="l3_4"
+       hw_config_guid="d7793b26-b5e3-4f0f-ad78-7ebc9d0b4c7d"
+       chipset="BDW"
+       symbol_name="L3_4"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SQ is full"
+             description="The percentage of time when SQ is filled above a threshold (usually 48 entries)"
+             data_type="float"
+             max_equation="100"
+             equation="PERFCNT1 READ_REG 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gt_request_queue_full"
+             units="percent"
+             symbol_name="GTRequestQueueFull"
+             availability="true $QueryMode &amp;&amp;"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL4 OCL"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texel lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 L3 Bank2 Stalled"
+             description="The percentage of time in which slice0 L3 bank2 is stalled"
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l30_bank2_stalled"
+             units="percent"
+             symbol_name="L30Bank2Stalled"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice1 L3 Bank2 Active"
+             description="The percentage of time in which slice1 L3 bank2 is active"
+             data_type="float"
+             max_equation="100"
+             equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l31_bank2_active"
+             units="percent"
+             symbol_name="L31Bank2Active"
+             availability="$SliceMask 0x2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Slice0 L3 Bank2 Active"
+             description="The percentage of time in which slice0 L3 bank2 is active"
+             data_type="float"
+             max_equation="100"
+             equation="C 6 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l30_bank2_active"
+             units="percent"
+             symbol_name="L30Bank2Active"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="Slice1 L3 Bank2 Stalled"
+             description="The percentage of time in which slice1 L3 bank2 is stalled"
+             data_type="float"
+             max_equation="100"
+             equation="B 4 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l31_bank2_stalled"
+             units="percent"
+             symbol_name="L31Bank2Stalled"
+             availability="$SliceMask 0x2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL 2 UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x000000A0" />
+        <register type="NOA" address="0x00009888" value="0x121A0340" />
+        <register type="NOA" address="0x00009888" value="0x103F0017" />
+        <register type="NOA" address="0x00009888" value="0x123F0020" />
+        <register type="NOA" address="0x00009888" value="0x129A0340" />
+        <register type="NOA" address="0x00009888" value="0x10BF0017" />
+        <register type="NOA" address="0x00009888" value="0x12BF0020" />
+        <register type="NOA" address="0x00009888" value="0x041A3400" />
+        <register type="NOA" address="0x00009888" value="0x101A0000" />
+        <register type="NOA" address="0x00009888" value="0x043B8000" />
+        <register type="NOA" address="0x00009888" value="0x0A3E0010" />
+        <register type="NOA" address="0x00009888" value="0x003F0200" />
+        <register type="NOA" address="0x00009888" value="0x023F0113" />
+        <register type="NOA" address="0x00009888" value="0x043F0014" />
+        <register type="NOA" address="0x00009888" value="0x02592000" />
+        <register type="NOA" address="0x00009888" value="0x005A8000" />
+        <register type="NOA" address="0x00009888" value="0x025AC000" />
+        <register type="NOA" address="0x00009888" value="0x045A4000" />
+        <register type="NOA" address="0x00009888" value="0x0A1C8000" />
+        <register type="NOA" address="0x00009888" value="0x001D8000" />
+        <register type="NOA" address="0x00009888" value="0x021DC000" />
+        <register type="NOA" address="0x00009888" value="0x041D4000" />
+        <register type="NOA" address="0x00009888" value="0x0A1E8000" />
+        <register type="NOA" address="0x00009888" value="0x0C1FA000" />
+        <register type="NOA" address="0x00009888" value="0x0E1F001A" />
+        <register type="NOA" address="0x00009888" value="0x00394000" />
+        <register type="NOA" address="0x00009888" value="0x02395000" />
+        <register type="NOA" address="0x00009888" value="0x04391000" />
+        <register type="NOA" address="0x00009888" value="0x069A0034" />
+        <register type="NOA" address="0x00009888" value="0x109A0000" />
+        <register type="NOA" address="0x00009888" value="0x06BB4000" />
+        <register type="NOA" address="0x00009888" value="0x0ABE0040" />
+        <register type="NOA" address="0x00009888" value="0x0CBF0984" />
+        <register type="NOA" address="0x00009888" value="0x0EBF0A02" />
+        <register type="NOA" address="0x00009888" value="0x02D94000" />
+        <register type="NOA" address="0x00009888" value="0x0CDAC000" />
+        <register type="NOA" address="0x00009888" value="0x0EDAC000" />
+        <register type="NOA" address="0x00009888" value="0x0C9C0400" />
+        <register type="NOA" address="0x00009888" value="0x0C9DC000" />
+        <register type="NOA" address="0x00009888" value="0x0E9DC000" />
+        <register type="NOA" address="0x00009888" value="0x0C9E0400" />
+        <register type="NOA" address="0x00009888" value="0x109F02A8" />
+        <register type="NOA" address="0x00009888" value="0x0E9F0040" />
+        <register type="NOA" address="0x00009888" value="0x0CB95000" />
+        <register type="NOA" address="0x00009888" value="0x0EB95000" />
+        <register type="NOA" address="0x00009888" value="0x0F88000F" />
+        <register type="NOA" address="0x00009888" value="0x0D880400" />
+        <register type="NOA" address="0x00009888" value="0x038A8000" />
+        <register type="NOA" address="0x00009888" value="0x058A8000" />
+        <register type="NOA" address="0x00009888" value="0x078A8000" />
+        <register type="NOA" address="0x00009888" value="0x098A8000" />
+        <register type="NOA" address="0x00009888" value="0x0B8A8000" />
+        <register type="NOA" address="0x00009888" value="0x258B8009" />
+        <register type="NOA" address="0x00009888" value="0x278B002A" />
+        <register type="NOA" address="0x00009888" value="0x238B2A80" />
+        <register type="NOA" address="0x00009888" value="0x198C4000" />
+        <register type="NOA" address="0x00009888" value="0x1B8C0015" />
+        <register type="NOA" address="0x00009888" value="0x0D8C4000" />
+        <register type="NOA" address="0x00009888" value="0x0D8DA000" />
+        <register type="NOA" address="0x00009888" value="0x0F8DA000" />
+        <register type="NOA" address="0x00009888" value="0x078D2000" />
+        <register type="NOA" address="0x00009888" value="0x2185800A" />
+        <register type="NOA" address="0x00009888" value="0x2385002A" />
+        <register type="NOA" address="0x00009888" value="0x1F85AA00" />
+        <register type="NOA" address="0x00009888" value="0x1B830154" />
+        <register type="NOA" address="0x00009888" value="0x03834000" />
+        <register type="NOA" address="0x00009888" value="0x05834000" />
+        <register type="NOA" address="0x00009888" value="0x07834000" />
+        <register type="NOA" address="0x00009888" value="0x09834000" />
+        <register type="NOA" address="0x00009888" value="0x0B834000" />
+        <register type="NOA" address="0x00009888" value="0x0D834000" />
+        <register type="NOA" address="0x00009888" value="0x0D84C000" />
+        <register type="NOA" address="0x00009888" value="0x0F84C000" />
+        <register type="NOA" address="0x00009888" value="0x01848000" />
+        <register type="NOA" address="0x00009888" value="0x0384C000" />
+        <register type="NOA" address="0x00009888" value="0x0584C000" />
+        <register type="NOA" address="0x00009888" value="0x07844000" />
+        <register type="NOA" address="0x00009888" value="0x1D80C000" />
+        <register type="NOA" address="0x00009888" value="0x1F80C000" />
+        <register type="NOA" address="0x00009888" value="0x11808000" />
+        <register type="NOA" address="0x00009888" value="0x1380C000" />
+        <register type="NOA" address="0x00009888" value="0x1580C000" />
+        <register type="NOA" address="0x00009888" value="0x17804000" />
+        <register type="NOA" address="0x00009888" value="0x53800000" />
+        <register type="NOA" address="0x00009888" value="0x45800800" />
+        <register type="NOA" address="0x00009888" value="0x47800842" />
+        <register type="NOA" address="0x00009888" value="0x21800000" />
+        <register type="NOA" address="0x00009888" value="0x31800000" />
+        <register type="NOA" address="0x00009888" value="0x4D800000" />
+        <register type="NOA" address="0x00009888" value="0x3F801084" />
+        <register type="NOA" address="0x00009888" value="0x4F800000" />
+        <register type="NOA" address="0x00009888" value="0x41800044" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x000091BC" value="0xE0500000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002744" value="0x00800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0xF0800000" />
+        <register type="OA" address="0x00002770" value="0x00100070" />
+        <register type="OA" address="0x00002774" value="0x0000FFF1" />
+        <register type="OA" address="0x00002778" value="0x00014002" />
+        <register type="OA" address="0x0000277C" value="0x0000C3FF" />
+        <register type="OA" address="0x00002780" value="0x00010002" />
+        <register type="OA" address="0x00002784" value="0x0000C7FF" />
+        <register type="OA" address="0x00002788" value="0x00004002" />
+        <register type="OA" address="0x0000278C" value="0x0000D3FF" />
+        <register type="OA" address="0x00002790" value="0x00100700" />
+        <register type="OA" address="0x00002794" value="0x0000FF1F" />
+        <register type="OA" address="0x00002798" value="0x00001402" />
+        <register type="OA" address="0x0000279C" value="0x0000FC3F" />
+        <register type="OA" address="0x000027A0" value="0x00001002" />
+        <register type="OA" address="0x000027A4" value="0x0000FC7F" />
+        <register type="OA" address="0x000027A8" value="0x00000402" />
+        <register type="OA" address="0x000027AC" value="0x0000FD3F" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E758" value="0x00015014" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+        <register type="FLEX" address="0x0000E65C" value="0x00055054" />
+    </register_config>
+  </set>
+
+  <set name="Metric set RasterizerAndPixelBackend"
+       mdapi_supported_apis="VK OGL OCL IO BB"
+       underscore_name="rasterizer_and_pixel_backend"
+       hw_config_guid="da0f7875-1143-4d73-a39c-9128a951c46a"
+       chipset="BDW"
+       symbol_name="RasterizerAndPixelBackend"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice1 Rasterizer Input Available"
+             description="The percentage of time in which slice1 rasterizer input is available"
+             data_type="float"
+             max_equation="100"
+             equation="B 3 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="rasterizer1_input_available"
+             units="percent"
+             symbol_name="Rasterizer1InputAvailable"
+             availability="$SliceMask 0x2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Rasterizer"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on the both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Slice0 Pixel Values Ready"
+             description="The percentage of time in which slice0 pixel values are ready"
+             data_type="float"
+             max_equation="100"
+             equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="pixel_values0_ready"
+             units="percent"
+             symbol_name="PixelValues0Ready"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/3D Pipe"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="Slice0 Rasterizer Input Available"
+             description="The percentage of time in which slice0 rasterizer input is available"
+             data_type="float"
+             max_equation="100"
+             equation="B 5 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="rasterizer0_input_available"
+             units="percent"
+             symbol_name="Rasterizer0InputAvailable"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Rasterizer"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Slice0 Post-EarlyZ Pixel Data Ready"
+             description="The percentage of time in which slice0 post-EarlyZ pixel data is ready (after early Z tests have been applied)"
+             data_type="float"
+             max_equation="100"
+             equation="B 2 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="pixel_data0_ready"
+             units="percent"
+             symbol_name="PixelData0Ready"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="GPU/Rasterizer/Early Depth Test"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice1 Pixel Values Ready"
+             description="The percentage of time in which slice1 pixel values are ready"
+             data_type="float"
+             max_equation="100"
+             equation="C 5 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="pixel_values1_ready"
+             units="percent"
+             symbol_name="PixelValues1Ready"
+             availability="$SliceMask 0x2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="GPU/3D Pipe"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Slice1 PS Output Available"
+             description="The percentage of time in which slice1 PS output is available"
+             data_type="float"
+             max_equation="100"
+             equation="C 4 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_output1_available"
+             units="percent"
+             symbol_name="PSOutput1Available"
+             availability="$SliceMask 0x2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/3D Pipe"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 Rasterizer Output Ready"
+             description="The percentage of time in which slice0 rasterizer output is ready"
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="rasterizer0_output_ready"
+             units="percent"
+             symbol_name="Rasterizer0OutputReady"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Rasterizer"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Slice1 Rasterizer Output Ready"
+             description="The percentage of time in which slice1 rasterizer output is ready"
+             data_type="float"
+             max_equation="100"
+             equation="B 4 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="rasterizer1_output_ready"
+             units="percent"
+             symbol_name="Rasterizer1OutputReady"
+             availability="$SliceMask 0x2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Rasterizer"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Slice1 Post-EarlyZ Pixel Data Ready"
+             description="The percentage of time in which slice1 post-EarlyZ pixel data is ready (after early Z tests have been applied)"
+             data_type="float"
+             max_equation="100"
+             equation="B 1 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="pixel_data1_ready"
+             units="percent"
+             symbol_name="PixelData1Ready"
+             availability="$SliceMask 0x2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Rasterizer/Early Depth Test"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="SQ is full"
+             description="The percentage of time when SQ is filled above a threshold (usually 48 entries)"
+             data_type="float"
+             max_equation="100"
+             equation="PERFCNT1 READ_REG 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gt_request_queue_full"
+             units="percent"
+             symbol_name="GTRequestQueueFull"
+             availability="true $QueryMode &&"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL4 OCL"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL 2 UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="Slice0 PS Output Available"
+             description="The percentage of time in which slice0 PS output is available"
+             data_type="float"
+             max_equation="100"
+             equation="C 6 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_output0_available"
+             units="percent"
+             symbol_name="PSOutput0Available"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/3D Pipe"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x000000A0" />
+        <register type="NOA" address="0x00009888" value="0x143B000E" />
+        <register type="NOA" address="0x00009888" value="0x043C55C0" />
+        <register type="NOA" address="0x00009888" value="0x0A1E0280" />
+        <register type="NOA" address="0x00009888" value="0x0C1E0408" />
+        <register type="NOA" address="0x00009888" value="0x10390000" />
+        <register type="NOA" address="0x00009888" value="0x12397A1F" />
+        <register type="NOA" address="0x00009888" value="0x14BB000E" />
+        <register type="NOA" address="0x00009888" value="0x04BC5000" />
+        <register type="NOA" address="0x00009888" value="0x0A9E0296" />
+        <register type="NOA" address="0x00009888" value="0x0C9E0008" />
+        <register type="NOA" address="0x00009888" value="0x10B90000" />
+        <register type="NOA" address="0x00009888" value="0x12B97A1F" />
+        <register type="NOA" address="0x00009888" value="0x063B0042" />
+        <register type="NOA" address="0x00009888" value="0x103B0000" />
+        <register type="NOA" address="0x00009888" value="0x083C0000" />
+        <register type="NOA" address="0x00009888" value="0x0A3E0040" />
+        <register type="NOA" address="0x00009888" value="0x043F8000" />
+        <register type="NOA" address="0x00009888" value="0x02594000" />
+        <register type="NOA" address="0x00009888" value="0x045A8000" />
+        <register type="NOA" address="0x00009888" value="0x0C1C0400" />
+        <register type="NOA" address="0x00009888" value="0x041D8000" />
+        <register type="NOA" address="0x00009888" value="0x081E02C0" />
+        <register type="NOA" address="0x00009888" value="0x0E1E0000" />
+        <register type="NOA" address="0x00009888" value="0x0C1FA800" />
+        <register type="NOA" address="0x00009888" value="0x0E1F0260" />
+        <register type="NOA" address="0x00009888" value="0x101F0014" />
+        <register type="NOA" address="0x00009888" value="0x003905E0" />
+        <register type="NOA" address="0x00009888" value="0x06390BC0" />
+        <register type="NOA" address="0x00009888" value="0x02390018" />
+        <register type="NOA" address="0x00009888" value="0x04394000" />
+        <register type="NOA" address="0x00009888" value="0x04BB0042" />
+        <register type="NOA" address="0x00009888" value="0x10BB0000" />
+        <register type="NOA" address="0x00009888" value="0x02BC05C0" />
+        <register type="NOA" address="0x00009888" value="0x08BC0000" />
+        <register type="NOA" address="0x00009888" value="0x0ABE0004" />
+        <register type="NOA" address="0x00009888" value="0x02BF8000" />
+        <register type="NOA" address="0x00009888" value="0x02D91000" />
+        <register type="NOA" address="0x00009888" value="0x02DA8000" />
+        <register type="NOA" address="0x00009888" value="0x089C8000" />
+        <register type="NOA" address="0x00009888" value="0x029D8000" />
+        <register type="NOA" address="0x00009888" value="0x089E8000" />
+        <register type="NOA" address="0x00009888" value="0x0E9E0000" />
+        <register type="NOA" address="0x00009888" value="0x0E9FA806" />
+        <register type="NOA" address="0x00009888" value="0x109F0142" />
+        <register type="NOA" address="0x00009888" value="0x08B90617" />
+        <register type="NOA" address="0x00009888" value="0x0AB90BE0" />
+        <register type="NOA" address="0x00009888" value="0x02B94000" />
+        <register type="NOA" address="0x00009888" value="0x0D88F000" />
+        <register type="NOA" address="0x00009888" value="0x0F88000C" />
+        <register type="NOA" address="0x00009888" value="0x07888000" />
+        <register type="NOA" address="0x00009888" value="0x09888000" />
+        <register type="NOA" address="0x00009888" value="0x018A8000" />
+        <register type="NOA" address="0x00009888" value="0x0F8A8000" />
+        <register type="NOA" address="0x00009888" value="0x1B8A2800" />
+        <register type="NOA" address="0x00009888" value="0x038A8000" />
+        <register type="NOA" address="0x00009888" value="0x058A8000" />
+        <register type="NOA" address="0x00009888" value="0x0B8A8000" />
+        <register type="NOA" address="0x00009888" value="0x0D8A8000" />
+        <register type="NOA" address="0x00009888" value="0x238B52A0" />
+        <register type="NOA" address="0x00009888" value="0x258B6A95" />
+        <register type="NOA" address="0x00009888" value="0x278B0029" />
+        <register type="NOA" address="0x00009888" value="0x178C2000" />
+        <register type="NOA" address="0x00009888" value="0x198C1500" />
+        <register type="NOA" address="0x00009888" value="0x1B8C0014" />
+        <register type="NOA" address="0x00009888" value="0x078C4000" />
+        <register type="NOA" address="0x00009888" value="0x098C4000" />
+        <register type="NOA" address="0x00009888" value="0x098DA000" />
+        <register type="NOA" address="0x00009888" value="0x0B8DA000" />
+        <register type="NOA" address="0x00009888" value="0x0F8DA000" />
+        <register type="NOA" address="0x00009888" value="0x038D8000" />
+        <register type="NOA" address="0x00009888" value="0x058D2000" />
+        <register type="NOA" address="0x00009888" value="0x1F85AA80" />
+        <register type="NOA" address="0x00009888" value="0x2185AAAA" />
+        <register type="NOA" address="0x00009888" value="0x2385002A" />
+        <register type="NOA" address="0x00009888" value="0x01834000" />
+        <register type="NOA" address="0x00009888" value="0x0F834000" />
+        <register type="NOA" address="0x00009888" value="0x19835400" />
+        <register type="NOA" address="0x00009888" value="0x1B830155" />
+        <register type="NOA" address="0x00009888" value="0x03834000" />
+        <register type="NOA" address="0x00009888" value="0x05834000" />
+        <register type="NOA" address="0x00009888" value="0x07834000" />
+        <register type="NOA" address="0x00009888" value="0x09834000" />
+        <register type="NOA" address="0x00009888" value="0x0B834000" />
+        <register type="NOA" address="0x00009888" value="0x0D834000" />
+        <register type="NOA" address="0x00009888" value="0x0184C000" />
+        <register type="NOA" address="0x00009888" value="0x0784C000" />
+        <register type="NOA" address="0x00009888" value="0x0984C000" />
+        <register type="NOA" address="0x00009888" value="0x0B84C000" />
+        <register type="NOA" address="0x00009888" value="0x0D84C000" />
+        <register type="NOA" address="0x00009888" value="0x0F84C000" />
+        <register type="NOA" address="0x00009888" value="0x0384C000" />
+        <register type="NOA" address="0x00009888" value="0x0584C000" />
+        <register type="NOA" address="0x00009888" value="0x1180C000" />
+        <register type="NOA" address="0x00009888" value="0x1780C000" />
+        <register type="NOA" address="0x00009888" value="0x1980C000" />
+        <register type="NOA" address="0x00009888" value="0x1B80C000" />
+        <register type="NOA" address="0x00009888" value="0x1D80C000" />
+        <register type="NOA" address="0x00009888" value="0x1F80C000" />
+        <register type="NOA" address="0x00009888" value="0x1380C000" />
+        <register type="NOA" address="0x00009888" value="0x1580C000" />
+        <register type="NOA" address="0x00009888" value="0x4D800444" />
+        <register type="NOA" address="0x00009888" value="0x3D800000" />
+        <register type="NOA" address="0x00009888" value="0x4F804000" />
+        <register type="NOA" address="0x00009888" value="0x43801080" />
+        <register type="NOA" address="0x00009888" value="0x51800000" />
+        <register type="NOA" address="0x00009888" value="0x45800084" />
+        <register type="NOA" address="0x00009888" value="0x53800044" />
+        <register type="NOA" address="0x00009888" value="0x47801080" />
+        <register type="NOA" address="0x00009888" value="0x21800000" />
+        <register type="NOA" address="0x00009888" value="0x31800000" />
+        <register type="NOA" address="0x00009888" value="0x3F800000" />
+        <register type="NOA" address="0x00009888" value="0x41800840" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x000091BC" value="0xE0500000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002744" value="0x00800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x30800000" />
+        <register type="OA" address="0x00002770" value="0x00006000" />
+        <register type="OA" address="0x00002774" value="0x0000F3FF" />
+        <register type="OA" address="0x00002778" value="0x00001800" />
+        <register type="OA" address="0x0000277C" value="0x0000FCFF" />
+        <register type="OA" address="0x00002780" value="0x00000600" />
+        <register type="OA" address="0x00002784" value="0x0000FF3F" />
+        <register type="OA" address="0x00002788" value="0x00000180" />
+        <register type="OA" address="0x0000278C" value="0x0000FFCF" />
+        <register type="OA" address="0x00002790" value="0x00000060" />
+        <register type="OA" address="0x00002794" value="0x0000FFF3" />
+        <register type="OA" address="0x00002798" value="0x00000018" />
+        <register type="OA" address="0x0000279C" value="0x0000FFFC" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E758" value="0x00015014" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+        <register type="FLEX" address="0x0000E65C" value="0x00055054" />
+    </register_config>
+  </set>
+
+  <set name="Metric set Sampler_1"
+       mdapi_supported_apis="VK OGL OCL IO BB"
+       underscore_name="sampler_1"
+       hw_config_guid="52c186e4-39e3-4534-87cd-41bd47763df9"
+       chipset="BDW"
+       symbol_name="Sampler_1"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SQ is full"
+             description="The percentage of time when SQ is filled above a threshold (usually 48 entries)"
+             data_type="float"
+             max_equation="100"
+             equation="PERFCNT1 READ_REG 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gt_request_queue_full"
+             units="percent"
+             symbol_name="GTRequestQueueFull"
+             availability="true $QueryMode &&"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL4 OCL"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Slice1 Subslice0 Input Available"
+             description="The percentage of time in which slice1 subslice0 sampler input is available"
+             data_type="float"
+             max_equation="100"
+             equation="B 2 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler10_input_available"
+             units="percent"
+             symbol_name="Sampler10InputAvailable"
+             availability="$SubsliceMask 0x8 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on the both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Slice1 Subslice2 Sampler Output Ready"
+             description="The percentage of time in which slice1 subslice2 sampler output is ready"
+             data_type="float"
+             max_equation="100"
+             equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler12_output_ready"
+             units="percent"
+             symbol_name="Sampler12OutputReady"
+             availability="$SubsliceMask 0x20 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice1 Subslice1 Input Available"
+             description="The percentage of time in which slice1 subslice1 sampler input is available"
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler11_input_available"
+             units="percent"
+             symbol_name="Sampler11InputAvailable"
+             availability="$SubsliceMask 0x10 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Slice1 Subslice2 Input Available"
+             description="The percentage of time in which slice1 subslice2 sampler input is available"
+             data_type="float"
+             max_equation="100"
+             equation="B 1 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler12_input_available"
+             units="percent"
+             symbol_name="Sampler12InputAvailable"
+             availability="$SubsliceMask 0x20 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Slice1 Subslice0 Sampler Output Ready"
+             description="The percentage of time in which slice1 subslice0 sampler output is ready"
+             data_type="float"
+             max_equation="100"
+             equation="C 6 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler10_output_ready"
+             units="percent"
+             symbol_name="Sampler10OutputReady"
+             availability="$SubsliceMask 0x8 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="Slice1 Subslice1 Sampler Output Ready"
+             description="The percentage of time in which slice1 subslice1 sampler output is ready"
+             data_type="float"
+             max_equation="100"
+             equation="C 5 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler11_output_ready"
+             units="percent"
+             symbol_name="Sampler11OutputReady"
+             availability="$SubsliceMask 0x10 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL 2 UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x000000A0" />
+        <register type="NOA" address="0x00009888" value="0x18921400" />
+        <register type="NOA" address="0x00009888" value="0x149500AB" />
+        <register type="NOA" address="0x00009888" value="0x18B21400" />
+        <register type="NOA" address="0x00009888" value="0x14B500AB" />
+        <register type="NOA" address="0x00009888" value="0x18D21400" />
+        <register type="NOA" address="0x00009888" value="0x14D500AB" />
+        <register type="NOA" address="0x00009888" value="0x0CDC8000" />
+        <register type="NOA" address="0x00009888" value="0x0EDC4000" />
+        <register type="NOA" address="0x00009888" value="0x02DCC000" />
+        <register type="NOA" address="0x00009888" value="0x04DCC000" />
+        <register type="NOA" address="0x00009888" value="0x1ABD00A0" />
+        <register type="NOA" address="0x00009888" value="0x0ABD8000" />
+        <register type="NOA" address="0x00009888" value="0x0CD88000" />
+        <register type="NOA" address="0x00009888" value="0x0ED84000" />
+        <register type="NOA" address="0x00009888" value="0x04D88000" />
+        <register type="NOA" address="0x00009888" value="0x1ADB0050" />
+        <register type="NOA" address="0x00009888" value="0x04DB8000" />
+        <register type="NOA" address="0x00009888" value="0x06DB8000" />
+        <register type="NOA" address="0x00009888" value="0x08DB8000" />
+        <register type="NOA" address="0x00009888" value="0x0ADB4000" />
+        <register type="NOA" address="0x00009888" value="0x109F02A0" />
+        <register type="NOA" address="0x00009888" value="0x0C9FA000" />
+        <register type="NOA" address="0x00009888" value="0x0E9F00AA" />
+        <register type="NOA" address="0x00009888" value="0x18B82500" />
+        <register type="NOA" address="0x00009888" value="0x02B88000" />
+        <register type="NOA" address="0x00009888" value="0x04B84000" />
+        <register type="NOA" address="0x00009888" value="0x06B84000" />
+        <register type="NOA" address="0x00009888" value="0x08B84000" />
+        <register type="NOA" address="0x00009888" value="0x0AB84000" />
+        <register type="NOA" address="0x00009888" value="0x0CB88000" />
+        <register type="NOA" address="0x00009888" value="0x0CB98000" />
+        <register type="NOA" address="0x00009888" value="0x0EB9A000" />
+        <register type="NOA" address="0x00009888" value="0x00B98000" />
+        <register type="NOA" address="0x00009888" value="0x02B9A000" />
+        <register type="NOA" address="0x00009888" value="0x04B9A000" />
+        <register type="NOA" address="0x00009888" value="0x06B92000" />
+        <register type="NOA" address="0x00009888" value="0x1ABA0200" />
+        <register type="NOA" address="0x00009888" value="0x02BA8000" />
+        <register type="NOA" address="0x00009888" value="0x0CBA8000" />
+        <register type="NOA" address="0x00009888" value="0x04908000" />
+        <register type="NOA" address="0x00009888" value="0x04918000" />
+        <register type="NOA" address="0x00009888" value="0x04927300" />
+        <register type="NOA" address="0x00009888" value="0x10920000" />
+        <register type="NOA" address="0x00009888" value="0x1893000A" />
+        <register type="NOA" address="0x00009888" value="0x0A934000" />
+        <register type="NOA" address="0x00009888" value="0x0A946000" />
+        <register type="NOA" address="0x00009888" value="0x0C959000" />
+        <register type="NOA" address="0x00009888" value="0x0E950098" />
+        <register type="NOA" address="0x00009888" value="0x10950000" />
+        <register type="NOA" address="0x00009888" value="0x04B04000" />
+        <register type="NOA" address="0x00009888" value="0x04B14000" />
+        <register type="NOA" address="0x00009888" value="0x04B20073" />
+        <register type="NOA" address="0x00009888" value="0x10B20000" />
+        <register type="NOA" address="0x00009888" value="0x04B38000" />
+        <register type="NOA" address="0x00009888" value="0x06B38000" />
+        <register type="NOA" address="0x00009888" value="0x08B34000" />
+        <register type="NOA" address="0x00009888" value="0x04B4C000" />
+        <register type="NOA" address="0x00009888" value="0x02B59890" />
+        <register type="NOA" address="0x00009888" value="0x10B50000" />
+        <register type="NOA" address="0x00009888" value="0x06D04000" />
+        <register type="NOA" address="0x00009888" value="0x06D14000" />
+        <register type="NOA" address="0x00009888" value="0x06D20073" />
+        <register type="NOA" address="0x00009888" value="0x10D20000" />
+        <register type="NOA" address="0x00009888" value="0x18D30020" />
+        <register type="NOA" address="0x00009888" value="0x02D38000" />
+        <register type="NOA" address="0x00009888" value="0x0CD34000" />
+        <register type="NOA" address="0x00009888" value="0x0AD48000" />
+        <register type="NOA" address="0x00009888" value="0x04D42000" />
+        <register type="NOA" address="0x00009888" value="0x0ED59000" />
+        <register type="NOA" address="0x00009888" value="0x00D59800" />
+        <register type="NOA" address="0x00009888" value="0x10D50000" />
+        <register type="NOA" address="0x00009888" value="0x0F88000E" />
+        <register type="NOA" address="0x00009888" value="0x03888000" />
+        <register type="NOA" address="0x00009888" value="0x05888000" />
+        <register type="NOA" address="0x00009888" value="0x07888000" />
+        <register type="NOA" address="0x00009888" value="0x09888000" />
+        <register type="NOA" address="0x00009888" value="0x0B888000" />
+        <register type="NOA" address="0x00009888" value="0x0D880400" />
+        <register type="NOA" address="0x00009888" value="0x278B002A" />
+        <register type="NOA" address="0x00009888" value="0x238B5500" />
+        <register type="NOA" address="0x00009888" value="0x258B000A" />
+        <register type="NOA" address="0x00009888" value="0x1B8C0015" />
+        <register type="NOA" address="0x00009888" value="0x038C4000" />
+        <register type="NOA" address="0x00009888" value="0x058C4000" />
+        <register type="NOA" address="0x00009888" value="0x078C4000" />
+        <register type="NOA" address="0x00009888" value="0x098C4000" />
+        <register type="NOA" address="0x00009888" value="0x0B8C4000" />
+        <register type="NOA" address="0x00009888" value="0x0D8C4000" />
+        <register type="NOA" address="0x00009888" value="0x0D8D8000" />
+        <register type="NOA" address="0x00009888" value="0x0F8DA000" />
+        <register type="NOA" address="0x00009888" value="0x018D8000" />
+        <register type="NOA" address="0x00009888" value="0x038DA000" />
+        <register type="NOA" address="0x00009888" value="0x058DA000" />
+        <register type="NOA" address="0x00009888" value="0x078D2000" />
+        <register type="NOA" address="0x00009888" value="0x2385002A" />
+        <register type="NOA" address="0x00009888" value="0x1F85AA00" />
+        <register type="NOA" address="0x00009888" value="0x2185000A" />
+        <register type="NOA" address="0x00009888" value="0x1B830150" />
+        <register type="NOA" address="0x00009888" value="0x03834000" />
+        <register type="NOA" address="0x00009888" value="0x05834000" />
+        <register type="NOA" address="0x00009888" value="0x07834000" />
+        <register type="NOA" address="0x00009888" value="0x09834000" />
+        <register type="NOA" address="0x00009888" value="0x0B834000" />
+        <register type="NOA" address="0x00009888" value="0x0D834000" />
+        <register type="NOA" address="0x00009888" value="0x0D848000" />
+        <register type="NOA" address="0x00009888" value="0x0F84C000" />
+        <register type="NOA" address="0x00009888" value="0x01848000" />
+        <register type="NOA" address="0x00009888" value="0x0384C000" />
+        <register type="NOA" address="0x00009888" value="0x0584C000" />
+        <register type="NOA" address="0x00009888" value="0x07844000" />
+        <register type="NOA" address="0x00009888" value="0x1D808000" />
+        <register type="NOA" address="0x00009888" value="0x1F80C000" />
+        <register type="NOA" address="0x00009888" value="0x11808000" />
+        <register type="NOA" address="0x00009888" value="0x1380C000" />
+        <register type="NOA" address="0x00009888" value="0x1580C000" />
+        <register type="NOA" address="0x00009888" value="0x17804000" />
+        <register type="NOA" address="0x00009888" value="0x53800000" />
+        <register type="NOA" address="0x00009888" value="0x47801021" />
+        <register type="NOA" address="0x00009888" value="0x21800000" />
+        <register type="NOA" address="0x00009888" value="0x31800000" />
+        <register type="NOA" address="0x00009888" value="0x4D800000" />
+        <register type="NOA" address="0x00009888" value="0x3F800C64" />
+        <register type="NOA" address="0x00009888" value="0x4F800000" />
+        <register type="NOA" address="0x00009888" value="0x41800C02" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x000091BC" value="0xE0500000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002744" value="0x00800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x70800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+        <register type="OA" address="0x00002770" value="0x0000C000" />
+        <register type="OA" address="0x00002774" value="0x0000E7FF" />
+        <register type="OA" address="0x00002778" value="0x00003000" />
+        <register type="OA" address="0x0000277C" value="0x0000F9FF" />
+        <register type="OA" address="0x00002780" value="0x00000C00" />
+        <register type="OA" address="0x00002784" value="0x0000FE7F" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E758" value="0x00015014" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+        <register type="FLEX" address="0x0000E65C" value="0x00055054" />
+    </register_config>
+  </set>
+
+  <set name="Metric set Sampler_2"
+       mdapi_supported_apis="VK OGL OCL IO BB"
+       underscore_name="sampler_2"
+       hw_config_guid="edcb8c31-764d-451a-9ecd-c9c89fb54f8d"
+       chipset="BDW"
+       symbol_name="Sampler_2"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 Subslice2 Input Available"
+             description="The percentage of time in which slice0 subslice2 sampler input is available"
+             data_type="float"
+             max_equation="100"
+             equation="B 1 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler02_input_available"
+             units="percent"
+             symbol_name="Sampler02InputAvailable"
+             availability="$SubsliceMask 0x4 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SQ is full"
+             description="The percentage of time when SQ is filled above a threshold (usually 48 entries)"
+             data_type="float"
+             max_equation="100"
+             equation="PERFCNT1 READ_REG 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gt_request_queue_full"
+             units="percent"
+             symbol_name="GTRequestQueueFull"
+             availability="true $QueryMode &&"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL4 OCL"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 Subslice0 Input Available"
+             description="The percentage of time in which slice0 subslice0 sampler input is available"
+             data_type="float"
+             max_equation="100"
+             equation="B 2 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler00_input_available"
+             units="percent"
+             symbol_name="Sampler00InputAvailable"
+             availability="$SubsliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on the both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="Slice0 Subslice2 Sampler Output Ready"
+             description="The percentage of time in which slice0 subslice2 sampler output is ready"
+             data_type="float"
+             max_equation="100"
+             equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler02_output_ready"
+             units="percent"
+             symbol_name="Sampler02OutputReady"
+             availability="$SubsliceMask 0x4 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Slice0 Subslice1 Input Available"
+             description="The percentage of time in which slice0 subslice1 sampler input is available."
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler01_input_available"
+             units="percent"
+             symbol_name="Sampler01InputAvailable"
+             availability="$SubsliceMask 0x2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texel lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Slice0 Subslice0 Sampler Output Ready"
+             description="The percentage of time in which slice0 subslice0 sampler output is ready."
+             data_type="float"
+             max_equation="100"
+             equation="C 6 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler00_output_ready"
+             units="percent"
+             symbol_name="Sampler00OutputReady"
+             availability="$SubsliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Slice0 Subslice1 Sampler Output Ready"
+             description="The percentage of time in which slice0 subslice1 sampler output is ready."
+             data_type="float"
+             max_equation="100"
+             equation="C 5 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler01_output_ready"
+             units="percent"
+             symbol_name="Sampler01OutputReady"
+             availability="$SubsliceMask 0x2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL 2 UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x000000A0" />
+        <register type="NOA" address="0x00009888" value="0x18121400" />
+        <register type="NOA" address="0x00009888" value="0x141500AB" />
+        <register type="NOA" address="0x00009888" value="0x18321400" />
+        <register type="NOA" address="0x00009888" value="0x143500AB" />
+        <register type="NOA" address="0x00009888" value="0x18521400" />
+        <register type="NOA" address="0x00009888" value="0x145500AB" />
+        <register type="NOA" address="0x00009888" value="0x0C5C8000" />
+        <register type="NOA" address="0x00009888" value="0x0E5C4000" />
+        <register type="NOA" address="0x00009888" value="0x025CC000" />
+        <register type="NOA" address="0x00009888" value="0x045CC000" />
+        <register type="NOA" address="0x00009888" value="0x1A3D00A0" />
+        <register type="NOA" address="0x00009888" value="0x0A3D8000" />
+        <register type="NOA" address="0x00009888" value="0x0C588000" />
+        <register type="NOA" address="0x00009888" value="0x0E584000" />
+        <register type="NOA" address="0x00009888" value="0x04588000" />
+        <register type="NOA" address="0x00009888" value="0x1A5B0050" />
+        <register type="NOA" address="0x00009888" value="0x045B8000" />
+        <register type="NOA" address="0x00009888" value="0x065B8000" />
+        <register type="NOA" address="0x00009888" value="0x085B8000" />
+        <register type="NOA" address="0x00009888" value="0x0A5B4000" />
+        <register type="NOA" address="0x00009888" value="0x101F02A0" />
+        <register type="NOA" address="0x00009888" value="0x0C1FA000" />
+        <register type="NOA" address="0x00009888" value="0x0E1F00AA" />
+        <register type="NOA" address="0x00009888" value="0x18382500" />
+        <register type="NOA" address="0x00009888" value="0x02388000" />
+        <register type="NOA" address="0x00009888" value="0x04384000" />
+        <register type="NOA" address="0x00009888" value="0x06384000" />
+        <register type="NOA" address="0x00009888" value="0x08384000" />
+        <register type="NOA" address="0x00009888" value="0x0A384000" />
+        <register type="NOA" address="0x00009888" value="0x0C388000" />
+        <register type="NOA" address="0x00009888" value="0x0C398000" />
+        <register type="NOA" address="0x00009888" value="0x0E39A000" />
+        <register type="NOA" address="0x00009888" value="0x00398000" />
+        <register type="NOA" address="0x00009888" value="0x0239A000" />
+        <register type="NOA" address="0x00009888" value="0x0439A000" />
+        <register type="NOA" address="0x00009888" value="0x06392000" />
+        <register type="NOA" address="0x00009888" value="0x1A3A0200" />
+        <register type="NOA" address="0x00009888" value="0x023A8000" />
+        <register type="NOA" address="0x00009888" value="0x0C3A8000" />
+        <register type="NOA" address="0x00009888" value="0x04108000" />
+        <register type="NOA" address="0x00009888" value="0x04118000" />
+        <register type="NOA" address="0x00009888" value="0x04127300" />
+        <register type="NOA" address="0x00009888" value="0x10120000" />
+        <register type="NOA" address="0x00009888" value="0x1813000A" />
+        <register type="NOA" address="0x00009888" value="0x0A134000" />
+        <register type="NOA" address="0x00009888" value="0x0A146000" />
+        <register type="NOA" address="0x00009888" value="0x0C159000" />
+        <register type="NOA" address="0x00009888" value="0x0E150098" />
+        <register type="NOA" address="0x00009888" value="0x10150000" />
+        <register type="NOA" address="0x00009888" value="0x04304000" />
+        <register type="NOA" address="0x00009888" value="0x04314000" />
+        <register type="NOA" address="0x00009888" value="0x04320073" />
+        <register type="NOA" address="0x00009888" value="0x10320000" />
+        <register type="NOA" address="0x00009888" value="0x04338000" />
+        <register type="NOA" address="0x00009888" value="0x06338000" />
+        <register type="NOA" address="0x00009888" value="0x08334000" />
+        <register type="NOA" address="0x00009888" value="0x0434C000" />
+        <register type="NOA" address="0x00009888" value="0x02359890" />
+        <register type="NOA" address="0x00009888" value="0x10350000" />
+        <register type="NOA" address="0x00009888" value="0x06504000" />
+        <register type="NOA" address="0x00009888" value="0x06514000" />
+        <register type="NOA" address="0x00009888" value="0x06520073" />
+        <register type="NOA" address="0x00009888" value="0x10520000" />
+        <register type="NOA" address="0x00009888" value="0x18530020" />
+        <register type="NOA" address="0x00009888" value="0x02538000" />
+        <register type="NOA" address="0x00009888" value="0x0C534000" />
+        <register type="NOA" address="0x00009888" value="0x0A548000" />
+        <register type="NOA" address="0x00009888" value="0x04542000" />
+        <register type="NOA" address="0x00009888" value="0x0E559000" />
+        <register type="NOA" address="0x00009888" value="0x00559800" />
+        <register type="NOA" address="0x00009888" value="0x10550000" />
+        <register type="NOA" address="0x00009888" value="0x1B8AA000" />
+        <register type="NOA" address="0x00009888" value="0x1D8A0002" />
+        <register type="NOA" address="0x00009888" value="0x038A8000" />
+        <register type="NOA" address="0x00009888" value="0x058A8000" />
+        <register type="NOA" address="0x00009888" value="0x078A8000" />
+        <register type="NOA" address="0x00009888" value="0x098A8000" />
+        <register type="NOA" address="0x00009888" value="0x0B8A8000" />
+        <register type="NOA" address="0x00009888" value="0x0D8A8000" />
+        <register type="NOA" address="0x00009888" value="0x278B0015" />
+        <register type="NOA" address="0x00009888" value="0x238B2A80" />
+        <register type="NOA" address="0x00009888" value="0x258B0005" />
+        <register type="NOA" address="0x00009888" value="0x2385002A" />
+        <register type="NOA" address="0x00009888" value="0x1F85AA00" />
+        <register type="NOA" address="0x00009888" value="0x2185000A" />
+        <register type="NOA" address="0x00009888" value="0x1B830150" />
+        <register type="NOA" address="0x00009888" value="0x03834000" />
+        <register type="NOA" address="0x00009888" value="0x05834000" />
+        <register type="NOA" address="0x00009888" value="0x07834000" />
+        <register type="NOA" address="0x00009888" value="0x09834000" />
+        <register type="NOA" address="0x00009888" value="0x0B834000" />
+        <register type="NOA" address="0x00009888" value="0x0D834000" />
+        <register type="NOA" address="0x00009888" value="0x0D848000" />
+        <register type="NOA" address="0x00009888" value="0x0F84C000" />
+        <register type="NOA" address="0x00009888" value="0x01848000" />
+        <register type="NOA" address="0x00009888" value="0x0384C000" />
+        <register type="NOA" address="0x00009888" value="0x0584C000" />
+        <register type="NOA" address="0x00009888" value="0x07844000" />
+        <register type="NOA" address="0x00009888" value="0x1D808000" />
+        <register type="NOA" address="0x00009888" value="0x1F80C000" />
+        <register type="NOA" address="0x00009888" value="0x11808000" />
+        <register type="NOA" address="0x00009888" value="0x1380C000" />
+        <register type="NOA" address="0x00009888" value="0x1580C000" />
+        <register type="NOA" address="0x00009888" value="0x17804000" />
+        <register type="NOA" address="0x00009888" value="0x53800000" />
+        <register type="NOA" address="0x00009888" value="0x47801021" />
+        <register type="NOA" address="0x00009888" value="0x21800000" />
+        <register type="NOA" address="0x00009888" value="0x31800000" />
+        <register type="NOA" address="0x00009888" value="0x4D800000" />
+        <register type="NOA" address="0x00009888" value="0x3F800C64" />
+        <register type="NOA" address="0x00009888" value="0x4F800000" />
+        <register type="NOA" address="0x00009888" value="0x41800C02" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x000091BC" value="0xE0500000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002744" value="0x00800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x70800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+        <register type="OA" address="0x00002770" value="0x0000C000" />
+        <register type="OA" address="0x00002774" value="0x0000E7FF" />
+        <register type="OA" address="0x00002778" value="0x00003000" />
+        <register type="OA" address="0x0000277C" value="0x0000F9FF" />
+        <register type="OA" address="0x00002780" value="0x00000C00" />
+        <register type="OA" address="0x00002784" value="0x0000FE7F" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E758" value="0x00015014" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+        <register type="FLEX" address="0x0000E65C" value="0x00055054" />
+    </register_config>
+  </set>
+
+  <set name="Metric set TDL_1"
+       mdapi_supported_apis="VK OGL OCL IO BB"
+       underscore_name="tdl_1"
+       hw_config_guid="729fc3f4-ccff-4902-be6b-f1a22cc92c02"
+       chipset="BDW"
+       symbol_name="TDL_1"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SQ is full"
+             description="The percentage of time when SQ is filled above a threshold (usually 48 entries)."
+             data_type="float"
+             max_equation="100"
+             equation="PERFCNT1 READ_REG 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gt_request_queue_full"
+             units="percent"
+             symbol_name="GTRequestQueueFull"
+             availability="true $QueryMode &&"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL4 OCL"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on the both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="PS Thread Ready For Dispatch on Slice1 Subslice1"
+             description="The percentage of time in which PS thread is ready for dispatch on slice1 subslice1 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="B 5 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_thread11_ready_for_dispatch"
+             units="percent"
+             symbol_name="PSThread11ReadyForDispatch"
+             availability="$SubsliceMask 0x10 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="NonPS Thread Ready For Dispatch on Slice1 Subslice2"
+             description="The percentage of time in which non-PS thread is ready for dispatch on slice1 subslice2 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="B 4 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="non_ps_thread12_ready_for_dispatch"
+             units="percent"
+             symbol_name="NonPSThread12ReadyForDispatch"
+             availability="$SubsliceMask 0x20 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="NonPS Thread Ready For Dispatch on Slice1 Subslice0"
+             description="The percentage of time in which non-PS thread is ready for dispatch on slice1 subslice0 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="B 2 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="non_ps_thread10_ready_for_dispatch"
+             units="percent"
+             symbol_name="NonPSThread10ReadyForDispatch"
+             availability="$SubsliceMask 0x8 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Thread Header Ready on Slice0 Subslice1 Port 0"
+             description="The percentage of time in which thread header is ready on slice0 subslice1 thread dispatcher port 0"
+             data_type="float"
+             max_equation="100"
+             equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header01_ready_port0"
+             units="percent"
+             symbol_name="ThreadHeader01ReadyPort0"
+             availability="$SubsliceMask 0x2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Thread Header Ready on Slice0 Subslice1 Port 1"
+             description="The percentage of time in which thread header is ready on slice0 subslice1 thread dispatcher port 1"
+             data_type="float"
+             max_equation="100"
+             equation="C 2 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header01_ready_port1"
+             units="percent"
+             symbol_name="ThreadHeader01ReadyPort1"
+             availability="$SubsliceMask 0x2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Thread Header Ready on Slice0 Subslice2 Port 1"
+             description="The percentage of time in which thread header is ready on slice0 subslice2 thread dispatcher port 1"
+             data_type="float"
+             max_equation="100"
+             equation="C 4 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header02_ready_port1"
+             units="percent"
+             symbol_name="ThreadHeader02ReadyPort1"
+             availability="$SubsliceMask 0x4 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Thread Header Ready on Slice0 Subslice2 Port 0"
+             description="The percentage of time in which thread header is ready on slice0 subslice2 thread dispatcher port 0"
+             data_type="float"
+             max_equation="100"
+             equation="C 3 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header02_ready_port0"
+             units="percent"
+             symbol_name="ThreadHeader02ReadyPort0"
+             availability="$SubsliceMask 0x4 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="PS Thread Ready For Dispatch on Slice1 Subslice2"
+             description="The percentage of time in which PS thread is ready for dispatch on slice1 subslice2 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="B 3 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_thread12_ready_for_dispatch"
+             units="percent"
+             symbol_name="PSThread12ReadyForDispatch"
+             availability="$SubsliceMask 0x20 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="PS Thread Ready For Dispatch on Slice1 Subslice0"
+             description="The percentage of time in which PS thread is ready for dispatch on slice1 subslice0 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="B 1 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_thread10_ready_for_dispatch"
+             units="percent"
+             symbol_name="PSThread10ReadyForDispatch"
+             availability="$SubsliceMask 0x8 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="NonPS Thread Ready For Dispatch on Slice1 Subslice1"
+             description="The percentage of time in which non-PS thread is ready for dispatch on slice1 subslice1 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="non_ps_thread11_ready_for_dispatch"
+             units="percent"
+             symbol_name="NonPSThread11ReadyForDispatch"
+             availability="$SubsliceMask 0x10 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL 2 UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="Thread Header Ready on Slice0 Subslice0 Port 0"
+             description="The percentage of time in which thread header is ready on slice0 subslice0 thread dispatcher port 0"
+             data_type="float"
+             max_equation="100"
+             equation="C 5 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header00_ready_port0"
+             units="percent"
+             symbol_name="ThreadHeader00ReadyPort0"
+             availability="$SubsliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <counter name="Thread Header Ready on Slice0 Subslice0 Port 1"
+             description="The percentage of time in which thread header is ready on slice0 subslice0 thread dispatcher port 1"
+             data_type="float"
+             max_equation="100"
+             equation="C 6 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header00_ready_port1"
+             units="percent"
+             symbol_name="ThreadHeader00ReadyPort1"
+             availability="$SubsliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x000000A0" />
+        <register type="NOA" address="0x00009888" value="0x16154D60" />
+        <register type="NOA" address="0x00009888" value="0x16352E60" />
+        <register type="NOA" address="0x00009888" value="0x16554D60" />
+        <register type="NOA" address="0x00009888" value="0x16950000" />
+        <register type="NOA" address="0x00009888" value="0x16B50000" />
+        <register type="NOA" address="0x00009888" value="0x16D50000" />
+        <register type="NOA" address="0x00009888" value="0x005C8000" />
+        <register type="NOA" address="0x00009888" value="0x045CC000" />
+        <register type="NOA" address="0x00009888" value="0x065C4000" />
+        <register type="NOA" address="0x00009888" value="0x083D8000" />
+        <register type="NOA" address="0x00009888" value="0x0A3D8000" />
+        <register type="NOA" address="0x00009888" value="0x0458C000" />
+        <register type="NOA" address="0x00009888" value="0x025B8000" />
+        <register type="NOA" address="0x00009888" value="0x085B4000" />
+        <register type="NOA" address="0x00009888" value="0x0A5B4000" />
+        <register type="NOA" address="0x00009888" value="0x0C5B8000" />
+        <register type="NOA" address="0x00009888" value="0x0C1FA000" />
+        <register type="NOA" address="0x00009888" value="0x0E1F00AA" />
+        <register type="NOA" address="0x00009888" value="0x02384000" />
+        <register type="NOA" address="0x00009888" value="0x04388000" />
+        <register type="NOA" address="0x00009888" value="0x06388000" />
+        <register type="NOA" address="0x00009888" value="0x08384000" />
+        <register type="NOA" address="0x00009888" value="0x0A384000" />
+        <register type="NOA" address="0x00009888" value="0x0C384000" />
+        <register type="NOA" address="0x00009888" value="0x00398000" />
+        <register type="NOA" address="0x00009888" value="0x0239A000" />
+        <register type="NOA" address="0x00009888" value="0x0439A000" />
+        <register type="NOA" address="0x00009888" value="0x06392000" />
+        <register type="NOA" address="0x00009888" value="0x043A8000" />
+        <register type="NOA" address="0x00009888" value="0x063A8000" />
+        <register type="NOA" address="0x00009888" value="0x08138000" />
+        <register type="NOA" address="0x00009888" value="0x0A138000" />
+        <register type="NOA" address="0x00009888" value="0x06143000" />
+        <register type="NOA" address="0x00009888" value="0x0415CFC7" />
+        <register type="NOA" address="0x00009888" value="0x10150000" />
+        <register type="NOA" address="0x00009888" value="0x02338000" />
+        <register type="NOA" address="0x00009888" value="0x0C338000" />
+        <register type="NOA" address="0x00009888" value="0x04342000" />
+        <register type="NOA" address="0x00009888" value="0x06344000" />
+        <register type="NOA" address="0x00009888" value="0x0035C700" />
+        <register type="NOA" address="0x00009888" value="0x063500CF" />
+        <register type="NOA" address="0x00009888" value="0x10350000" />
+        <register type="NOA" address="0x00009888" value="0x04538000" />
+        <register type="NOA" address="0x00009888" value="0x06538000" />
+        <register type="NOA" address="0x00009888" value="0x0454C000" />
+        <register type="NOA" address="0x00009888" value="0x0255CFC7" />
+        <register type="NOA" address="0x00009888" value="0x10550000" />
+        <register type="NOA" address="0x00009888" value="0x06DC8000" />
+        <register type="NOA" address="0x00009888" value="0x08DC4000" />
+        <register type="NOA" address="0x00009888" value="0x0CDCC000" />
+        <register type="NOA" address="0x00009888" value="0x0EDCC000" />
+        <register type="NOA" address="0x00009888" value="0x1ABD00A8" />
+        <register type="NOA" address="0x00009888" value="0x0CD8C000" />
+        <register type="NOA" address="0x00009888" value="0x0ED84000" />
+        <register type="NOA" address="0x00009888" value="0x0EDB8000" />
+        <register type="NOA" address="0x00009888" value="0x18DB0800" />
+        <register type="NOA" address="0x00009888" value="0x1ADB0254" />
+        <register type="NOA" address="0x00009888" value="0x0E9FAA00" />
+        <register type="NOA" address="0x00009888" value="0x109F02AA" />
+        <register type="NOA" address="0x00009888" value="0x0EB84000" />
+        <register type="NOA" address="0x00009888" value="0x16B84000" />
+        <register type="NOA" address="0x00009888" value="0x18B8156A" />
+        <register type="NOA" address="0x00009888" value="0x06B98000" />
+        <register type="NOA" address="0x00009888" value="0x08B9A000" />
+        <register type="NOA" address="0x00009888" value="0x0AB9A000" />
+        <register type="NOA" address="0x00009888" value="0x0CB9A000" />
+        <register type="NOA" address="0x00009888" value="0x0EB9A000" />
+        <register type="NOA" address="0x00009888" value="0x18BAA000" />
+        <register type="NOA" address="0x00009888" value="0x1ABA0002" />
+        <register type="NOA" address="0x00009888" value="0x16934000" />
+        <register type="NOA" address="0x00009888" value="0x1893000A" />
+        <register type="NOA" address="0x00009888" value="0x0A947000" />
+        <register type="NOA" address="0x00009888" value="0x0C95C5C1" />
+        <register type="NOA" address="0x00009888" value="0x0E9500C3" />
+        <register type="NOA" address="0x00009888" value="0x10950000" />
+        <register type="NOA" address="0x00009888" value="0x0EB38000" />
+        <register type="NOA" address="0x00009888" value="0x16B30040" />
+        <register type="NOA" address="0x00009888" value="0x18B30020" />
+        <register type="NOA" address="0x00009888" value="0x06B48000" />
+        <register type="NOA" address="0x00009888" value="0x08B41000" />
+        <register type="NOA" address="0x00009888" value="0x0AB48000" />
+        <register type="NOA" address="0x00009888" value="0x06B5C500" />
+        <register type="NOA" address="0x00009888" value="0x08B500C3" />
+        <register type="NOA" address="0x00009888" value="0x0EB5C100" />
+        <register type="NOA" address="0x00009888" value="0x10B50000" />
+        <register type="NOA" address="0x00009888" value="0x16D31500" />
+        <register type="NOA" address="0x00009888" value="0x08D4E000" />
+        <register type="NOA" address="0x00009888" value="0x08D5C100" />
+        <register type="NOA" address="0x00009888" value="0x0AD5C3C5" />
+        <register type="NOA" address="0x00009888" value="0x10D50000" />
+        <register type="NOA" address="0x00009888" value="0x0D88F800" />
+        <register type="NOA" address="0x00009888" value="0x0F88000F" />
+        <register type="NOA" address="0x00009888" value="0x038A8000" />
+        <register type="NOA" address="0x00009888" value="0x058A8000" />
+        <register type="NOA" address="0x00009888" value="0x078A8000" />
+        <register type="NOA" address="0x00009888" value="0x098A8000" />
+        <register type="NOA" address="0x00009888" value="0x0B8A8000" />
+        <register type="NOA" address="0x00009888" value="0x0D8A8000" />
+        <register type="NOA" address="0x00009888" value="0x258BAAA5" />
+        <register type="NOA" address="0x00009888" value="0x278B002A" />
+        <register type="NOA" address="0x00009888" value="0x238B2A80" />
+        <register type="NOA" address="0x00009888" value="0x0F8C4000" />
+        <register type="NOA" address="0x00009888" value="0x178C2000" />
+        <register type="NOA" address="0x00009888" value="0x198C5500" />
+        <register type="NOA" address="0x00009888" value="0x1B8C0015" />
+        <register type="NOA" address="0x00009888" value="0x078D8000" />
+        <register type="NOA" address="0x00009888" value="0x098DA000" />
+        <register type="NOA" address="0x00009888" value="0x0B8DA000" />
+        <register type="NOA" address="0x00009888" value="0x0D8DA000" />
+        <register type="NOA" address="0x00009888" value="0x0F8DA000" />
+        <register type="NOA" address="0x00009888" value="0x2185AAAA" />
+        <register type="NOA" address="0x00009888" value="0x2385002A" />
+        <register type="NOA" address="0x00009888" value="0x1F85AA00" />
+        <register type="NOA" address="0x00009888" value="0x0F834000" />
+        <register type="NOA" address="0x00009888" value="0x19835400" />
+        <register type="NOA" address="0x00009888" value="0x1B830155" />
+        <register type="NOA" address="0x00009888" value="0x03834000" />
+        <register type="NOA" address="0x00009888" value="0x05834000" />
+        <register type="NOA" address="0x00009888" value="0x07834000" />
+        <register type="NOA" address="0x00009888" value="0x09834000" />
+        <register type="NOA" address="0x00009888" value="0x0B834000" />
+        <register type="NOA" address="0x00009888" value="0x0D834000" />
+        <register type="NOA" address="0x00009888" value="0x0784C000" />
+        <register type="NOA" address="0x00009888" value="0x0984C000" />
+        <register type="NOA" address="0x00009888" value="0x0B84C000" />
+        <register type="NOA" address="0x00009888" value="0x0D84C000" />
+        <register type="NOA" address="0x00009888" value="0x0F84C000" />
+        <register type="NOA" address="0x00009888" value="0x01848000" />
+        <register type="NOA" address="0x00009888" value="0x0384C000" />
+        <register type="NOA" address="0x00009888" value="0x0584C000" />
+        <register type="NOA" address="0x00009888" value="0x1780C000" />
+        <register type="NOA" address="0x00009888" value="0x1980C000" />
+        <register type="NOA" address="0x00009888" value="0x1B80C000" />
+        <register type="NOA" address="0x00009888" value="0x1D80C000" />
+        <register type="NOA" address="0x00009888" value="0x1F80C000" />
+        <register type="NOA" address="0x00009888" value="0x11808000" />
+        <register type="NOA" address="0x00009888" value="0x1380C000" />
+        <register type="NOA" address="0x00009888" value="0x1580C000" />
+        <register type="NOA" address="0x00009888" value="0x4F800000" />
+        <register type="NOA" address="0x00009888" value="0x43800C42" />
+        <register type="NOA" address="0x00009888" value="0x51800000" />
+        <register type="NOA" address="0x00009888" value="0x45800063" />
+        <register type="NOA" address="0x00009888" value="0x53800000" />
+        <register type="NOA" address="0x00009888" value="0x47800800" />
+        <register type="NOA" address="0x00009888" value="0x21800000" />
+        <register type="NOA" address="0x00009888" value="0x31800000" />
+        <register type="NOA" address="0x00009888" value="0x4D800000" />
+        <register type="NOA" address="0x00009888" value="0x3F8014A4" />
+        <register type="NOA" address="0x00009888" value="0x41801042" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x000091BC" value="0xE0500000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002744" value="0x00800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x30800000" />
+        <register type="OA" address="0x00002770" value="0x00000002" />
+        <register type="OA" address="0x00002774" value="0x0000FDFF" />
+        <register type="OA" address="0x00002778" value="0x00000000" />
+        <register type="OA" address="0x0000277C" value="0x0000FE7F" />
+        <register type="OA" address="0x00002780" value="0x00000002" />
+        <register type="OA" address="0x00002784" value="0x0000FFBF" />
+        <register type="OA" address="0x00002788" value="0x00000000" />
+        <register type="OA" address="0x0000278C" value="0x0000FFCF" />
+        <register type="OA" address="0x00002790" value="0x00000002" />
+        <register type="OA" address="0x00002794" value="0x0000FFF7" />
+        <register type="OA" address="0x00002798" value="0x00000000" />
+        <register type="OA" address="0x0000279C" value="0x0000FFF9" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E758" value="0x00015014" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+        <register type="FLEX" address="0x0000E65C" value="0x00055054" />
+    </register_config>
+  </set>
+
+  <set name="Metric set TDL_2"
+       mdapi_supported_apis="VK OGL OCL IO BB"
+       underscore_name="tdl_2"
+       hw_config_guid="29598975-4785-43ab-a981-1dfa58d0e835"
+       chipset="BDW"
+       symbol_name="TDL_2"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Thread Header Ready on Slice1 Subslice1 Port 1"
+             description="The percentage of time in which thread header is ready on slice1 subslice1 thread dispatcher port 1"
+             data_type="float"
+             max_equation="100"
+             equation="C 5 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header11_ready_port1"
+             units="percent"
+             symbol_name="ThreadHeader11ReadyPort1"
+             availability="$SubsliceMask 0x10 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on the both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="NonPS Thread Ready For Dispatch on Slice0 Subslice2"
+             description="The percentage of time in which non-PS thread is ready for dispatch on slice0 subslice2 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="non_ps_thread02_ready_for_dispatch"
+             units="percent"
+             symbol_name="NonPSThread02ReadyForDispatch"
+             availability="$SubsliceMask 0x4 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="NonPS Thread Ready For Dispatch on Slice0 Subslice0"
+             description="The percentage of time in which non-PS thread is ready for dispatch on slice0 subslice0 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="B 5 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="non_ps_thread00_ready_for_dispatch"
+             units="percent"
+             symbol_name="NonPSThread00ReadyForDispatch"
+             availability="$SubsliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SQ is full"
+             description="The percentage of time when SQ is filled above a threshold (usually 48 entries)"
+             data_type="float"
+             max_equation="100"
+             equation="PERFCNT1 READ_REG 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gt_request_queue_full"
+             units="percent"
+             symbol_name="GTRequestQueueFull"
+             availability="true $QueryMode &&"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL4 OCL"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Thread Header Ready on Slice1 Subslice1 Port 0"
+             description="The percentage of time in which thread header is ready on slice1 subslice1 thread dispatcher port 0"
+             data_type="float"
+             max_equation="100"
+             equation="C 2 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header11_ready_port0"
+             units="percent"
+             symbol_name="ThreadHeader11ReadyPort0"
+             availability="$SubsliceMask 0x10 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Thread Header Ready on Slice1 Subslice2 Port 0"
+             description="The percentage of time in which thread header is ready on slice1 subslice2 thread dispatcher port 0"
+             data_type="float"
+             max_equation="100"
+             equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header12_ready_port0"
+             units="percent"
+             symbol_name="ThreadHeader12ReadyPort0"
+             availability="$SubsliceMask 0x20 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="PS Thread Ready For Dispatch on Slice0 Subslice0"
+             description="The percentage of time in which PS thread is ready for dispatch on slice0 subslice0 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="B 3 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_thread00_ready_for_dispatch"
+             units="percent"
+             symbol_name="PSThread00ReadyForDispatch"
+             availability="$SubsliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Thread Header Ready on Slice1 Subslice0 Port 1"
+             description="The percentage of time in which thread header is ready on slice1 subslice0 thread dispatcher port 1"
+             data_type="float"
+             max_equation="100"
+             equation="C 3 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header10_ready_port1"
+             units="percent"
+             symbol_name="ThreadHeader10ReadyPort1"
+             availability="$SubsliceMask 0x8 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="PS Thread Ready For Dispatch on Slice0 Subslice1"
+             description="The percentage of time in which PS thread is ready for dispatch on slice0 subslice1 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="B 2 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_thread01_ready_for_dispatch"
+             units="percent"
+             symbol_name="PSThread01ReadyForDispatch"
+             availability="$SubsliceMask 0x2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Thread Header Ready on Slice1 Subslice2 Port 1"
+             description="The percentage of time in which thread header is ready on slice1 subslice2 thread dispatcher port 1"
+             data_type="float"
+             max_equation="100"
+             equation="C 6 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header12_ready_port1"
+             units="percent"
+             symbol_name="ThreadHeader12ReadyPort1"
+             availability="$SubsliceMask 0x20 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="PS Thread Ready For Dispatch on Slice0 Subslice2"
+             description="The percentage of time in which PS thread is ready for dispatch on slice0 subslice2 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="B 1 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_thread02_ready_for_dispatch"
+             units="percent"
+             symbol_name="PSThread02ReadyForDispatch"
+             availability="$SubsliceMask 0x4 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL 2 UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="Thread Header Ready on Slice1 Subslice0 Port 0"
+             description="The percentage of time in which thread header is ready on slice1 subslice0 thread dispatcher port 0"
+             data_type="float"
+             max_equation="100"
+             equation="C 4 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header10_ready_port0"
+             units="percent"
+             symbol_name="ThreadHeader10ReadyPort0"
+             availability="$SubsliceMask 0x8 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <counter name="NonPS Thread Ready For Dispatch on Slice0 Subslice1"
+             description="The percentage of time in which non-PS thread is ready for dispatch on slice0 subslice1 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="B 4 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="non_ps_thread01_ready_for_dispatch"
+             units="percent"
+             symbol_name="NonPSThread01ReadyForDispatch"
+             availability="$SubsliceMask 0x2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x000000A0" />
+        <register type="NOA" address="0x00009888" value="0x16150000" />
+        <register type="NOA" address="0x00009888" value="0x16350000" />
+        <register type="NOA" address="0x00009888" value="0x16550000" />
+        <register type="NOA" address="0x00009888" value="0x16952E60" />
+        <register type="NOA" address="0x00009888" value="0x16B54D60" />
+        <register type="NOA" address="0x00009888" value="0x16D52E60" />
+        <register type="NOA" address="0x00009888" value="0x065C8000" />
+        <register type="NOA" address="0x00009888" value="0x085CC000" />
+        <register type="NOA" address="0x00009888" value="0x0A5CC000" />
+        <register type="NOA" address="0x00009888" value="0x0C5C4000" />
+        <register type="NOA" address="0x00009888" value="0x0E3D8000" />
+        <register type="NOA" address="0x00009888" value="0x183DA000" />
+        <register type="NOA" address="0x00009888" value="0x06588000" />
+        <register type="NOA" address="0x00009888" value="0x08588000" />
+        <register type="NOA" address="0x00009888" value="0x0A584000" />
+        <register type="NOA" address="0x00009888" value="0x0E5B4000" />
+        <register type="NOA" address="0x00009888" value="0x185B5800" />
+        <register type="NOA" address="0x00009888" value="0x1A5B000A" />
+        <register type="NOA" address="0x00009888" value="0x0E1FAA00" />
+        <register type="NOA" address="0x00009888" value="0x101F02AA" />
+        <register type="NOA" address="0x00009888" value="0x0E384000" />
+        <register type="NOA" address="0x00009888" value="0x16384000" />
+        <register type="NOA" address="0x00009888" value="0x18382A55" />
+        <register type="NOA" address="0x00009888" value="0x06398000" />
+        <register type="NOA" address="0x00009888" value="0x0839A000" />
+        <register type="NOA" address="0x00009888" value="0x0A39A000" />
+        <register type="NOA" address="0x00009888" value="0x0C39A000" />
+        <register type="NOA" address="0x00009888" value="0x0E39A000" />
+        <register type="NOA" address="0x00009888" value="0x1A3A02A0" />
+        <register type="NOA" address="0x00009888" value="0x0E138000" />
+        <register type="NOA" address="0x00009888" value="0x16130500" />
+        <register type="NOA" address="0x00009888" value="0x06148000" />
+        <register type="NOA" address="0x00009888" value="0x08146000" />
+        <register type="NOA" address="0x00009888" value="0x0615C100" />
+        <register type="NOA" address="0x00009888" value="0x0815C500" />
+        <register type="NOA" address="0x00009888" value="0x0A1500C3" />
+        <register type="NOA" address="0x00009888" value="0x10150000" />
+        <register type="NOA" address="0x00009888" value="0x16335040" />
+        <register type="NOA" address="0x00009888" value="0x08349000" />
+        <register type="NOA" address="0x00009888" value="0x0A341000" />
+        <register type="NOA" address="0x00009888" value="0x083500C1" />
+        <register type="NOA" address="0x00009888" value="0x0A35C500" />
+        <register type="NOA" address="0x00009888" value="0x0C3500C3" />
+        <register type="NOA" address="0x00009888" value="0x10350000" />
+        <register type="NOA" address="0x00009888" value="0x1853002A" />
+        <register type="NOA" address="0x00009888" value="0x0A54E000" />
+        <register type="NOA" address="0x00009888" value="0x0C55C500" />
+        <register type="NOA" address="0x00009888" value="0x0E55C1C3" />
+        <register type="NOA" address="0x00009888" value="0x10550000" />
+        <register type="NOA" address="0x00009888" value="0x00DC8000" />
+        <register type="NOA" address="0x00009888" value="0x02DCC000" />
+        <register type="NOA" address="0x00009888" value="0x04DC4000" />
+        <register type="NOA" address="0x00009888" value="0x04BD8000" />
+        <register type="NOA" address="0x00009888" value="0x06BD8000" />
+        <register type="NOA" address="0x00009888" value="0x02D8C000" />
+        <register type="NOA" address="0x00009888" value="0x02DB8000" />
+        <register type="NOA" address="0x00009888" value="0x04DB4000" />
+        <register type="NOA" address="0x00009888" value="0x06DB4000" />
+        <register type="NOA" address="0x00009888" value="0x08DB8000" />
+        <register type="NOA" address="0x00009888" value="0x0C9FA000" />
+        <register type="NOA" address="0x00009888" value="0x0E9F00AA" />
+        <register type="NOA" address="0x00009888" value="0x02B84000" />
+        <register type="NOA" address="0x00009888" value="0x04B84000" />
+        <register type="NOA" address="0x00009888" value="0x06B84000" />
+        <register type="NOA" address="0x00009888" value="0x08B84000" />
+        <register type="NOA" address="0x00009888" value="0x0AB88000" />
+        <register type="NOA" address="0x00009888" value="0x0CB88000" />
+        <register type="NOA" address="0x00009888" value="0x00B98000" />
+        <register type="NOA" address="0x00009888" value="0x02B9A000" />
+        <register type="NOA" address="0x00009888" value="0x04B9A000" />
+        <register type="NOA" address="0x00009888" value="0x06B92000" />
+        <register type="NOA" address="0x00009888" value="0x0ABA8000" />
+        <register type="NOA" address="0x00009888" value="0x0CBA8000" />
+        <register type="NOA" address="0x00009888" value="0x04938000" />
+        <register type="NOA" address="0x00009888" value="0x06938000" />
+        <register type="NOA" address="0x00009888" value="0x0494C000" />
+        <register type="NOA" address="0x00009888" value="0x0295CFC7" />
+        <register type="NOA" address="0x00009888" value="0x10950000" />
+        <register type="NOA" address="0x00009888" value="0x02B38000" />
+        <register type="NOA" address="0x00009888" value="0x08B38000" />
+        <register type="NOA" address="0x00009888" value="0x04B42000" />
+        <register type="NOA" address="0x00009888" value="0x06B41000" />
+        <register type="NOA" address="0x00009888" value="0x00B5C700" />
+        <register type="NOA" address="0x00009888" value="0x04B500CF" />
+        <register type="NOA" address="0x00009888" value="0x10B50000" />
+        <register type="NOA" address="0x00009888" value="0x0AD38000" />
+        <register type="NOA" address="0x00009888" value="0x0CD38000" />
+        <register type="NOA" address="0x00009888" value="0x06D46000" />
+        <register type="NOA" address="0x00009888" value="0x04D5C700" />
+        <register type="NOA" address="0x00009888" value="0x06D500CF" />
+        <register type="NOA" address="0x00009888" value="0x10D50000" />
+        <register type="NOA" address="0x00009888" value="0x03888000" />
+        <register type="NOA" address="0x00009888" value="0x05888000" />
+        <register type="NOA" address="0x00009888" value="0x07888000" />
+        <register type="NOA" address="0x00009888" value="0x09888000" />
+        <register type="NOA" address="0x00009888" value="0x0B888000" />
+        <register type="NOA" address="0x00009888" value="0x0D880400" />
+        <register type="NOA" address="0x00009888" value="0x0F8A8000" />
+        <register type="NOA" address="0x00009888" value="0x198A8000" />
+        <register type="NOA" address="0x00009888" value="0x1B8AAAA0" />
+        <register type="NOA" address="0x00009888" value="0x1D8A0002" />
+        <register type="NOA" address="0x00009888" value="0x258B555A" />
+        <register type="NOA" address="0x00009888" value="0x278B0015" />
+        <register type="NOA" address="0x00009888" value="0x238B5500" />
+        <register type="NOA" address="0x00009888" value="0x038C4000" />
+        <register type="NOA" address="0x00009888" value="0x058C4000" />
+        <register type="NOA" address="0x00009888" value="0x078C4000" />
+        <register type="NOA" address="0x00009888" value="0x098C4000" />
+        <register type="NOA" address="0x00009888" value="0x0B8C4000" />
+        <register type="NOA" address="0x00009888" value="0x0D8C4000" />
+        <register type="NOA" address="0x00009888" value="0x018D8000" />
+        <register type="NOA" address="0x00009888" value="0x038DA000" />
+        <register type="NOA" address="0x00009888" value="0x058DA000" />
+        <register type="NOA" address="0x00009888" value="0x078D2000" />
+        <register type="NOA" address="0x00009888" value="0x2185AAAA" />
+        <register type="NOA" address="0x00009888" value="0x2385002A" />
+        <register type="NOA" address="0x00009888" value="0x1F85AA00" />
+        <register type="NOA" address="0x00009888" value="0x0F834000" />
+        <register type="NOA" address="0x00009888" value="0x19835400" />
+        <register type="NOA" address="0x00009888" value="0x1B830155" />
+        <register type="NOA" address="0x00009888" value="0x03834000" />
+        <register type="NOA" address="0x00009888" value="0x05834000" />
+        <register type="NOA" address="0x00009888" value="0x07834000" />
+        <register type="NOA" address="0x00009888" value="0x09834000" />
+        <register type="NOA" address="0x00009888" value="0x0B834000" />
+        <register type="NOA" address="0x00009888" value="0x0D834000" />
+        <register type="NOA" address="0x00009888" value="0x0784C000" />
+        <register type="NOA" address="0x00009888" value="0x0984C000" />
+        <register type="NOA" address="0x00009888" value="0x0B84C000" />
+        <register type="NOA" address="0x00009888" value="0x0D84C000" />
+        <register type="NOA" address="0x00009888" value="0x0F84C000" />
+        <register type="NOA" address="0x00009888" value="0x01848000" />
+        <register type="NOA" address="0x00009888" value="0x0384C000" />
+        <register type="NOA" address="0x00009888" value="0x0584C000" />
+        <register type="NOA" address="0x00009888" value="0x1780C000" />
+        <register type="NOA" address="0x00009888" value="0x1980C000" />
+        <register type="NOA" address="0x00009888" value="0x1B80C000" />
+        <register type="NOA" address="0x00009888" value="0x1D80C000" />
+        <register type="NOA" address="0x00009888" value="0x1F80C000" />
+        <register type="NOA" address="0x00009888" value="0x11808000" />
+        <register type="NOA" address="0x00009888" value="0x1380C000" />
+        <register type="NOA" address="0x00009888" value="0x1580C000" />
+        <register type="NOA" address="0x00009888" value="0x4F800000" />
+        <register type="NOA" address="0x00009888" value="0x43800882" />
+        <register type="NOA" address="0x00009888" value="0x51800000" />
+        <register type="NOA" address="0x00009888" value="0x45801082" />
+        <register type="NOA" address="0x00009888" value="0x53800000" />
+        <register type="NOA" address="0x00009888" value="0x478014A5" />
+        <register type="NOA" address="0x00009888" value="0x21800000" />
+        <register type="NOA" address="0x00009888" value="0x31800000" />
+        <register type="NOA" address="0x00009888" value="0x4D800000" />
+        <register type="NOA" address="0x00009888" value="0x3F800002" />
+        <register type="NOA" address="0x00009888" value="0x41800C62" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x000091BC" value="0xE0500000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002744" value="0x00800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x30800000" />
+        <register type="OA" address="0x00002770" value="0x00000002" />
+        <register type="OA" address="0x00002774" value="0x0000FDFF" />
+        <register type="OA" address="0x00002778" value="0x00000000" />
+        <register type="OA" address="0x0000277C" value="0x0000FE7F" />
+        <register type="OA" address="0x00002780" value="0x00000000" />
+        <register type="OA" address="0x00002784" value="0x0000FF9F" />
+        <register type="OA" address="0x00002788" value="0x00000000" />
+        <register type="OA" address="0x0000278C" value="0x0000FFE7" />
+        <register type="OA" address="0x00002790" value="0x00000002" />
+        <register type="OA" address="0x00002794" value="0x0000FFFB" />
+        <register type="OA" address="0x00002798" value="0x00000002" />
+        <register type="OA" address="0x0000279C" value="0x0000FFFD" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E758" value="0x00015014" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+        <register type="FLEX" address="0x0000E65C" value="0x00055054" />
+    </register_config>
+  </set>
+
+  <set name="Compute Metrics Extra Gen8"
+       mdapi_supported_apis="VK OGL4 OCL IO BB"
+       underscore_name="compute_extra"
+       hw_config_guid="8fb61ba2-2fbb-454c-a136-2dec5a8a595e"
+       chipset="BDW"
+       symbol_name="ComputeExtra"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="fpu1_active"
+             units="percent"
+             symbol_name="Fpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU1 Pipe Active including Ext Math"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing including Extended Math processing"
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ  C 5 READ C 6 READ FADD C 7 READ FADD C 2 READ FADD C 3 READ FADD C 4 READ FADD 8 FMUL FADD 100 FMUL $EuCoresTotalCount FDIV $GpuCoreClocks FDIV"
+             underscore_name="fpu1_active_adjusted"
+             units="percent"
+             symbol_name="Fpu1ActiveAdjusted"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x000000A0" />
+        <register type="NOA" address="0x00009888" value="0x161503E0" />
+        <register type="NOA" address="0x00009888" value="0x163503E0" />
+        <register type="NOA" address="0x00009888" value="0x165503E0" />
+        <register type="NOA" address="0x00009888" value="0x169503E0" />
+        <register type="NOA" address="0x00009888" value="0x16B503E0" />
+        <register type="NOA" address="0x00009888" value="0x16D503E0" />
+        <register type="NOA" address="0x00009888" value="0x045CC000" />
+        <register type="NOA" address="0x00009888" value="0x083D8000" />
+        <register type="NOA" address="0x00009888" value="0x04584000" />
+        <register type="NOA" address="0x00009888" value="0x085B4000" />
+        <register type="NOA" address="0x00009888" value="0x0A5B8000" />
+        <register type="NOA" address="0x00009888" value="0x0E1F00A8" />
+        <register type="NOA" address="0x00009888" value="0x08384000" />
+        <register type="NOA" address="0x00009888" value="0x0A384000" />
+        <register type="NOA" address="0x00009888" value="0x0C388000" />
+        <register type="NOA" address="0x00009888" value="0x0439A000" />
+        <register type="NOA" address="0x00009888" value="0x06392000" />
+        <register type="NOA" address="0x00009888" value="0x0C3A8000" />
+        <register type="NOA" address="0x00009888" value="0x08138000" />
+        <register type="NOA" address="0x00009888" value="0x06141000" />
+        <register type="NOA" address="0x00009888" value="0x041500C3" />
+        <register type="NOA" address="0x00009888" value="0x10150000" />
+        <register type="NOA" address="0x00009888" value="0x0A338000" />
+        <register type="NOA" address="0x00009888" value="0x06342000" />
+        <register type="NOA" address="0x00009888" value="0x0435C300" />
+        <register type="NOA" address="0x00009888" value="0x10350000" />
+        <register type="NOA" address="0x00009888" value="0x0C538000" />
+        <register type="NOA" address="0x00009888" value="0x06544000" />
+        <register type="NOA" address="0x00009888" value="0x065500C3" />
+        <register type="NOA" address="0x00009888" value="0x10550000" />
+        <register type="NOA" address="0x00009888" value="0x00DC8000" />
+        <register type="NOA" address="0x00009888" value="0x02DC4000" />
+        <register type="NOA" address="0x00009888" value="0x02BD8000" />
+        <register type="NOA" address="0x00009888" value="0x00D88000" />
+        <register type="NOA" address="0x00009888" value="0x02DB4000" />
+        <register type="NOA" address="0x00009888" value="0x04DB8000" />
+        <register type="NOA" address="0x00009888" value="0x0C9FA000" />
+        <register type="NOA" address="0x00009888" value="0x0E9F0002" />
+        <register type="NOA" address="0x00009888" value="0x02B84000" />
+        <register type="NOA" address="0x00009888" value="0x04B84000" />
+        <register type="NOA" address="0x00009888" value="0x06B88000" />
+        <register type="NOA" address="0x00009888" value="0x00B98000" />
+        <register type="NOA" address="0x00009888" value="0x02B9A000" />
+        <register type="NOA" address="0x00009888" value="0x06BA8000" />
+        <register type="NOA" address="0x00009888" value="0x02938000" />
+        <register type="NOA" address="0x00009888" value="0x04942000" />
+        <register type="NOA" address="0x00009888" value="0x0095C300" />
+        <register type="NOA" address="0x00009888" value="0x10950000" />
+        <register type="NOA" address="0x00009888" value="0x04B38000" />
+        <register type="NOA" address="0x00009888" value="0x04B44000" />
+        <register type="NOA" address="0x00009888" value="0x02B500C3" />
+        <register type="NOA" address="0x00009888" value="0x10B50000" />
+        <register type="NOA" address="0x00009888" value="0x06D38000" />
+        <register type="NOA" address="0x00009888" value="0x04D48000" />
+        <register type="NOA" address="0x00009888" value="0x02D5C300" />
+        <register type="NOA" address="0x00009888" value="0x10D50000" />
+        <register type="NOA" address="0x00009888" value="0x03888000" />
+        <register type="NOA" address="0x00009888" value="0x05888000" />
+        <register type="NOA" address="0x00009888" value="0x07888000" />
+        <register type="NOA" address="0x00009888" value="0x098A8000" />
+        <register type="NOA" address="0x00009888" value="0x0B8A8000" />
+        <register type="NOA" address="0x00009888" value="0x0D8A8000" />
+        <register type="NOA" address="0x00009888" value="0x238B3500" />
+        <register type="NOA" address="0x00009888" value="0x258B0005" />
+        <register type="NOA" address="0x00009888" value="0x038C4000" />
+        <register type="NOA" address="0x00009888" value="0x058C4000" />
+        <register type="NOA" address="0x00009888" value="0x078C4000" />
+        <register type="NOA" address="0x00009888" value="0x018D8000" />
+        <register type="NOA" address="0x00009888" value="0x038DA000" />
+        <register type="NOA" address="0x00009888" value="0x1F85AA00" />
+        <register type="NOA" address="0x00009888" value="0x2185000A" />
+        <register type="NOA" address="0x00009888" value="0x03834000" />
+        <register type="NOA" address="0x00009888" value="0x05834000" />
+        <register type="NOA" address="0x00009888" value="0x07834000" />
+        <register type="NOA" address="0x00009888" value="0x09834000" />
+        <register type="NOA" address="0x00009888" value="0x0B834000" />
+        <register type="NOA" address="0x00009888" value="0x0D834000" />
+        <register type="NOA" address="0x00009888" value="0x01848000" />
+        <register type="NOA" address="0x00009888" value="0x0384C000" />
+        <register type="NOA" address="0x00009888" value="0x0584C000" />
+        <register type="NOA" address="0x00009888" value="0x07844000" />
+        <register type="NOA" address="0x00009888" value="0x11808000" />
+        <register type="NOA" address="0x00009888" value="0x1380C000" />
+        <register type="NOA" address="0x00009888" value="0x1580C000" />
+        <register type="NOA" address="0x00009888" value="0x17804000" />
+        <register type="NOA" address="0x00009888" value="0x21800000" />
+        <register type="NOA" address="0x00009888" value="0x4D800000" />
+        <register type="NOA" address="0x00009888" value="0x3F800C40" />
+        <register type="NOA" address="0x00009888" value="0x4F800000" />
+        <register type="NOA" address="0x00009888" value="0x41801482" />
+        <register type="NOA" address="0x00009888" value="0x31800000" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002744" value="0x00800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x00800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00001000" />
+        <register type="FLEX" address="0x0000E558" value="0x00003002" />
+        <register type="FLEX" address="0x0000E658" value="0x00005004" />
+        <register type="FLEX" address="0x0000E758" value="0x00011010" />
+        <register type="FLEX" address="0x0000E45C" value="0x00050012" />
+        <register type="FLEX" address="0x0000E55C" value="0x00052051" />
+        <register type="FLEX" address="0x0000E65C" value="0x00000008" />
+    </register_config>
+  </set>
+
+  <set name="Media Vme Pipe Gen8"
+       mdapi_supported_apis="MEDIA IO BB"
+       underscore_name="vme_pipe"
+       hw_config_guid="e1743ca0-7fc8-410b-a066-de7bbb9280b7"
+       chipset="BDW"
+       symbol_name="VMEPipe"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="EU Thread Occupancy"
+             description="The percentage of time in which hardware threads occupied EUs."
+             data_type="float"
+             max_equation="100"
+             equation="8 A 10 READ FMUL $EuThreadsCount FDIV $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_thread_occupancy"
+             units="percent"
+             symbol_name="EuThreadOccupancy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VME Busy"
+             description="The percentage of time in which VME (IME or CRE) was actively processing data."
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ B 3 READ FADD 2 FDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vme_busy"
+             units="percent"
+             symbol_name="VMEBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Overview System Batch Tier2"
+             mdapi_group="VME Pipe"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x000000A0" />
+        <register type="NOA" address="0x00009888" value="0x14100812" />
+        <register type="NOA" address="0x00009888" value="0x14125800" />
+        <register type="NOA" address="0x00009888" value="0x161200C0" />
+        <register type="NOA" address="0x00009888" value="0x14300812" />
+        <register type="NOA" address="0x00009888" value="0x14325800" />
+        <register type="NOA" address="0x00009888" value="0x163200C0" />
+        <register type="NOA" address="0x00009888" value="0x005C4000" />
+        <register type="NOA" address="0x00009888" value="0x065C8000" />
+        <register type="NOA" address="0x00009888" value="0x085CC000" />
+        <register type="NOA" address="0x00009888" value="0x0A5CC000" />
+        <register type="NOA" address="0x00009888" value="0x0C5CC000" />
+        <register type="NOA" address="0x00009888" value="0x003D8000" />
+        <register type="NOA" address="0x00009888" value="0x0E3D8000" />
+        <register type="NOA" address="0x00009888" value="0x183D2800" />
+        <register type="NOA" address="0x00009888" value="0x00584000" />
+        <register type="NOA" address="0x00009888" value="0x06588000" />
+        <register type="NOA" address="0x00009888" value="0x0858C000" />
+        <register type="NOA" address="0x00009888" value="0x005B4000" />
+        <register type="NOA" address="0x00009888" value="0x0E5B4000" />
+        <register type="NOA" address="0x00009888" value="0x185B9400" />
+        <register type="NOA" address="0x00009888" value="0x1A5B002A" />
+        <register type="NOA" address="0x00009888" value="0x0C1F0800" />
+        <register type="NOA" address="0x00009888" value="0x0E1FAA00" />
+        <register type="NOA" address="0x00009888" value="0x101F002A" />
+        <register type="NOA" address="0x00009888" value="0x00384000" />
+        <register type="NOA" address="0x00009888" value="0x0E384000" />
+        <register type="NOA" address="0x00009888" value="0x16384000" />
+        <register type="NOA" address="0x00009888" value="0x18380155" />
+        <register type="NOA" address="0x00009888" value="0x00392000" />
+        <register type="NOA" address="0x00009888" value="0x06398000" />
+        <register type="NOA" address="0x00009888" value="0x0839A000" />
+        <register type="NOA" address="0x00009888" value="0x0A39A000" />
+        <register type="NOA" address="0x00009888" value="0x0C39A000" />
+        <register type="NOA" address="0x00009888" value="0x00100047" />
+        <register type="NOA" address="0x00009888" value="0x06101A80" />
+        <register type="NOA" address="0x00009888" value="0x10100000" />
+        <register type="NOA" address="0x00009888" value="0x0810C000" />
+        <register type="NOA" address="0x00009888" value="0x0811C000" />
+        <register type="NOA" address="0x00009888" value="0x08126151" />
+        <register type="NOA" address="0x00009888" value="0x10120000" />
+        <register type="NOA" address="0x00009888" value="0x00134000" />
+        <register type="NOA" address="0x00009888" value="0x0E134000" />
+        <register type="NOA" address="0x00009888" value="0x161300A0" />
+        <register type="NOA" address="0x00009888" value="0x0A301AC7" />
+        <register type="NOA" address="0x00009888" value="0x10300000" />
+        <register type="NOA" address="0x00009888" value="0x0C30C000" />
+        <register type="NOA" address="0x00009888" value="0x0C31C000" />
+        <register type="NOA" address="0x00009888" value="0x0C326151" />
+        <register type="NOA" address="0x00009888" value="0x10320000" />
+        <register type="NOA" address="0x00009888" value="0x16332A00" />
+        <register type="NOA" address="0x00009888" value="0x18330001" />
+        <register type="NOA" address="0x00009888" value="0x018A8000" />
+        <register type="NOA" address="0x00009888" value="0x0F8A8000" />
+        <register type="NOA" address="0x00009888" value="0x198A8000" />
+        <register type="NOA" address="0x00009888" value="0x1B8A2AA0" />
+        <register type="NOA" address="0x00009888" value="0x238B0020" />
+        <register type="NOA" address="0x00009888" value="0x258B5550" />
+        <register type="NOA" address="0x00009888" value="0x278B0001" />
+        <register type="NOA" address="0x00009888" value="0x1F850080" />
+        <register type="NOA" address="0x00009888" value="0x2185AAA0" />
+        <register type="NOA" address="0x00009888" value="0x23850002" />
+        <register type="NOA" address="0x00009888" value="0x01834000" />
+        <register type="NOA" address="0x00009888" value="0x0F834000" />
+        <register type="NOA" address="0x00009888" value="0x19835400" />
+        <register type="NOA" address="0x00009888" value="0x1B830015" />
+        <register type="NOA" address="0x00009888" value="0x01844000" />
+        <register type="NOA" address="0x00009888" value="0x07848000" />
+        <register type="NOA" address="0x00009888" value="0x0984C000" />
+        <register type="NOA" address="0x00009888" value="0x0B84C000" />
+        <register type="NOA" address="0x00009888" value="0x0D84C000" />
+        <register type="NOA" address="0x00009888" value="0x11804000" />
+        <register type="NOA" address="0x00009888" value="0x17808000" />
+        <register type="NOA" address="0x00009888" value="0x1980C000" />
+        <register type="NOA" address="0x00009888" value="0x1B80C000" />
+        <register type="NOA" address="0x00009888" value="0x1D80C000" />
+        <register type="NOA" address="0x00009888" value="0x4D800000" />
+        <register type="NOA" address="0x00009888" value="0x3D800800" />
+        <register type="NOA" address="0x00009888" value="0x4F800000" />
+        <register type="NOA" address="0x00009888" value="0x43800002" />
+        <register type="NOA" address="0x00009888" value="0x51800000" />
+        <register type="NOA" address="0x00009888" value="0x45800884" />
+        <register type="NOA" address="0x00009888" value="0x53800000" />
+        <register type="NOA" address="0x00009888" value="0x47800002" />
+        <register type="NOA" address="0x00009888" value="0x21800000" />
+        <register type="NOA" address="0x00009888" value="0x31800000" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x30800000" />
+        <register type="OA" address="0x00002770" value="0x00100030" />
+        <register type="OA" address="0x00002774" value="0x0000FFF9" />
+        <register type="OA" address="0x00002778" value="0x00000002" />
+        <register type="OA" address="0x0000277C" value="0x0000FFFC" />
+        <register type="OA" address="0x00002780" value="0x00000002" />
+        <register type="OA" address="0x00002784" value="0x0000FFF3" />
+        <register type="OA" address="0x00002788" value="0x00100180" />
+        <register type="OA" address="0x0000278C" value="0x0000FFCF" />
+        <register type="OA" address="0x00002790" value="0x00000002" />
+        <register type="OA" address="0x00002794" value="0x0000FFCF" />
+        <register type="OA" address="0x00002798" value="0x00000002" />
+        <register type="OA" address="0x0000279C" value="0x0000FF3F" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00008003" />
+    </register_config>
+  </set>
+
+  <set name="Gpu Rings Busyness"
+       mdapi_supported_apis="VK OGL OCL MEDIA IO BB"
+       underscore_name="gpu_busyness"
+       hw_config_guid="0a9eb7be-feee-4275-a139-6d9cedf0fdb0"
+       chipset="BDW"
+       symbol_name="GpuBusyness"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="Vebox Ring Busy"
+             description="The percentage of time when vebox command streamer was busy."
+             data_type="float"
+             max_equation="100"
+             equation="C 5 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vebox_busy"
+             units="percent"
+             symbol_name="VeboxBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="System Frame Batch"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Render Ring Busy"
+             description="The percentage of time when render command streamer was busy."
+             data_type="float"
+             max_equation="100"
+             equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="render_busy"
+             units="percent"
+             symbol_name="RenderBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="System Frame Batch"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Vdbox0 Ring Busy"
+             description="The percentage of time when Vdbox0 command streamer was busy."
+             data_type="float"
+             max_equation="100"
+             equation="C 6 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vdbox0_busy"
+             units="percent"
+             symbol_name="Vdbox0Busy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="System Frame Batch"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Blitter Ring Busy"
+             description="The percentage of time when blitter command streamer was busy."
+             data_type="float"
+             max_equation="100"
+             equation="C 4 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="blitter_busy"
+             units="percent"
+             symbol_name="BlitterBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="System Frame Batch"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="AnyRingBusy"
+             description="The percentage of time when any command streamer was busy."
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="any_ring_busy"
+             units="percent"
+             symbol_name="AnyRingBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Vdbox1 Ring Busy"
+             description="The percentage of time when Vdbox1 command streamer was busy."
+             data_type="float"
+             max_equation="100"
+             equation="C 3 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vdbox1_busy"
+             units="percent"
+             symbol_name="Vdbox1Busy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="System Frame Batch"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x000000A0" />
+        <register type="NOA" address="0x00009888" value="0x1AF00100" />
+        <register type="NOA" address="0x00009888" value="0x118B0000" />
+        <register type="NOA" address="0x00009888" value="0x11850008" />
+        <register type="NOA" address="0x00009888" value="0x17830100" />
+        <register type="NOA" address="0x00009888" value="0x1A700100" />
+        <register type="NOA" address="0x00009888" value="0x1D940040" />
+        <register type="NOA" address="0x00009888" value="0x02F00085" />
+        <register type="NOA" address="0x00009888" value="0x10F00000" />
+        <register type="NOA" address="0x00009888" value="0x24F00000" />
+        <register type="NOA" address="0x00009888" value="0x078B0003" />
+        <register type="NOA" address="0x00009888" value="0x238B0400" />
+        <register type="NOA" address="0x00009888" value="0x258B0000" />
+        <register type="NOA" address="0x00009888" value="0x058C8000" />
+        <register type="NOA" address="0x00009888" value="0x038D2000" />
+        <register type="NOA" address="0x00009888" value="0x03850500" />
+        <register type="NOA" address="0x00009888" value="0x1F858800" />
+        <register type="NOA" address="0x00009888" value="0x2185000A" />
+        <register type="NOA" address="0x00009888" value="0x05834055" />
+        <register type="NOA" address="0x00009888" value="0x11830000" />
+        <register type="NOA" address="0x00009888" value="0x09830000" />
+        <register type="NOA" address="0x00009888" value="0x0B838000" />
+        <register type="NOA" address="0x00009888" value="0x0D834000" />
+        <register type="NOA" address="0x00009888" value="0x03844000" />
+        <register type="NOA" address="0x00009888" value="0x0584C000" />
+        <register type="NOA" address="0x00009888" value="0x07844000" />
+        <register type="NOA" address="0x00009888" value="0x1380C000" />
+        <register type="NOA" address="0x00009888" value="0x1580C000" />
+        <register type="NOA" address="0x00009888" value="0x17804000" />
+        <register type="NOA" address="0x00009888" value="0x04708500" />
+        <register type="NOA" address="0x00009888" value="0x10700000" />
+        <register type="NOA" address="0x00009888" value="0x24700000" />
+        <register type="NOA" address="0x00009888" value="0x21800000" />
+        <register type="NOA" address="0x00009888" value="0x4D801000" />
+        <register type="NOA" address="0x00009888" value="0x3F800000" />
+        <register type="NOA" address="0x00009888" value="0x4F800004" />
+        <register type="NOA" address="0x00009888" value="0x418014A0" />
+        <register type="NOA" address="0x00009888" value="0x31800000" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x10800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+        <register type="OA" address="0x00002770" value="0x0007C000" />
+        <register type="OA" address="0x00002774" value="0x000007FF" />
+    </register_config>
+  </set>
+
+  <set name="MDAPI testing set Gen8"
+       mdapi_supported_apis="VK OGL OCL IO BB"
+       underscore_name="test_oa"
+       hw_config_guid="d6de6f55-e526-4f79-a6a6-d7315c09044e"
+       chipset="BDW"
+       symbol_name="TestOa"
+       >
+    <counter name="TestCounter7"
+             description="HW test counter 7. Factor: 0.666"
+             data_type="uint64"
+             equation="B 7 READ"
+             underscore_name="counter7"
+             units="events"
+             symbol_name="Counter7"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="TestCounter8"
+             description="HW test counter 8. Should be equal to 1."
+             data_type="uint64"
+             equation="C 7 READ"
+             underscore_name="counter8"
+             units="events"
+             symbol_name="Counter8"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="TestCounter4"
+             description="HW test counter 4. Factor: 0.333"
+             data_type="uint64"
+             equation="B 4 READ"
+             underscore_name="counter4"
+             units="events"
+             symbol_name="Counter4"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="TestCounter5"
+             description="HW test counter 5. Factor: 0.333"
+             data_type="uint64"
+             equation="B 5 READ"
+             underscore_name="counter5"
+             units="events"
+             symbol_name="Counter5"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="TestCounter6"
+             description="HW test counter 6. Factor: 0.166"
+             data_type="uint64"
+             equation="B 6 READ"
+             underscore_name="counter6"
+             units="events"
+             symbol_name="Counter6"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="TestCounter3"
+             description="HW test counter 3. Factor: 0.5"
+             data_type="uint64"
+             equation="B 3 READ"
+             underscore_name="counter3"
+             units="events"
+             symbol_name="Counter3"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="TestCounter0"
+             description="HW test counter 0. Factor: 0.0"
+             data_type="uint64"
+             equation="B 0 READ"
+             underscore_name="counter0"
+             units="events"
+             symbol_name="Counter0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="TestCounter1"
+             description="HW test counter 1. Factor: 1.0"
+             data_type="uint64"
+             equation="B 1 READ"
+             underscore_name="counter1"
+             units="events"
+             symbol_name="Counter1"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="TestCounter2"
+             description="HW test counter 2. Factor: 1.0"
+             data_type="uint64"
+             equation="B 2 READ"
+             underscore_name="counter2"
+             units="events"
+             symbol_name="Counter2"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x000000A0" />
+        <register type="NOA" address="0x00009888" value="0x198B0000" />
+        <register type="NOA" address="0x00009888" value="0x078B0066" />
+        <register type="NOA" address="0x00009888" value="0x118B0000" />
+        <register type="NOA" address="0x00009888" value="0x258B0000" />
+        <register type="NOA" address="0x00009888" value="0x21850008" />
+        <register type="NOA" address="0x00009888" value="0x0D834000" />
+        <register type="NOA" address="0x00009888" value="0x07844000" />
+        <register type="NOA" address="0x00009888" value="0x17804000" />
+        <register type="NOA" address="0x00009888" value="0x21800000" />
+        <register type="NOA" address="0x00009888" value="0x4F800000" />
+        <register type="NOA" address="0x00009888" value="0x41800000" />
+        <register type="NOA" address="0x00009888" value="0x31800000" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002744" value="0x00800000" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002770" value="0x00000004" />
+        <register type="OA" address="0x00002774" value="0x00000000" />
+        <register type="OA" address="0x00002778" value="0x00000003" />
+        <register type="OA" address="0x0000277C" value="0x00000000" />
+        <register type="OA" address="0x00002780" value="0x00000007" />
+        <register type="OA" address="0x00002784" value="0x00000000" />
+        <register type="OA" address="0x00002788" value="0x00100002" />
+        <register type="OA" address="0x0000278C" value="0x0000FFF7" />
+        <register type="OA" address="0x00002790" value="0x00100002" />
+        <register type="OA" address="0x00002794" value="0x0000FFCF" />
+        <register type="OA" address="0x00002798" value="0x00100082" />
+        <register type="OA" address="0x0000279C" value="0x0000FFEF" />
+        <register type="OA" address="0x000027A0" value="0x001000C2" />
+        <register type="OA" address="0x000027A4" value="0x0000FFE7" />
+        <register type="OA" address="0x000027A8" value="0x00100001" />
+        <register type="OA" address="0x000027AC" value="0x0000FFE7" />
+    </register_config>
+  </set>
+
+  <set name="Metric set PMA Stall"
+       mdapi_supported_apis="VK OGL OGL4 IO BB"
+       underscore_name="stc__pma_stall"
+       hw_config_guid="e713f347-953e-4d8c-b02f-6be31df2db2b"
+       chipset="BDW"
+       symbol_name="STC_PmaStall"
+       >
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="STC PMA stall"
+             description="Percentage of time when stencil cache line and an overlapping pixel are causing stalls"
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="stc_pma_stall"
+             units="percent"
+             symbol_name="StcPMAStall"
+             availability="$SliceMask 1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_group="GPU/Stencil Cache"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x000000A0" />
+        <register type="NOA" address="0x00009888" value="0x0C1F0001" />
+        <register type="NOA" address="0x00009888" value="0x001F0015" />
+        <register type="NOA" address="0x00009888" value="0x041F4AC0" />
+        <register type="NOA" address="0x00009888" value="0x061F03D8" />
+        <register type="NOA" address="0x00009888" value="0x0E1F0000" />
+        <register type="NOA" address="0x00009888" value="0x018A8000" />
+        <register type="NOA" address="0x00009888" value="0x0F8A8000" />
+        <register type="NOA" address="0x00009888" value="0x198A8000" />
+        <register type="NOA" address="0x00009888" value="0x1B8A00A0" />
+        <register type="NOA" address="0x00009888" value="0x238B0020" />
+        <register type="NOA" address="0x00009888" value="0x258B0550" />
+        <register type="NOA" address="0x00009888" value="0x1F850080" />
+        <register type="NOA" address="0x00009888" value="0x21850AA0" />
+        <register type="NOA" address="0x00009888" value="0x01834000" />
+        <register type="NOA" address="0x00009888" value="0x0F834000" />
+        <register type="NOA" address="0x00009888" value="0x19835400" />
+        <register type="NOA" address="0x00009888" value="0x01844000" />
+        <register type="NOA" address="0x00009888" value="0x07848000" />
+        <register type="NOA" address="0x00009888" value="0x0984C000" />
+        <register type="NOA" address="0x00009888" value="0x0B844000" />
+        <register type="NOA" address="0x00009888" value="0x11804000" />
+        <register type="NOA" address="0x00009888" value="0x17808000" />
+        <register type="NOA" address="0x00009888" value="0x1980C000" />
+        <register type="NOA" address="0x00009888" value="0x1B804000" />
+        <register type="NOA" address="0x00009888" value="0x4D800000" />
+        <register type="NOA" address="0x00009888" value="0x3D800000" />
+        <register type="NOA" address="0x00009888" value="0x4F800000" />
+        <register type="NOA" address="0x00009888" value="0x43800000" />
+        <register type="NOA" address="0x00009888" value="0x51800000" />
+        <register type="NOA" address="0x00009888" value="0x45800000" />
+        <register type="NOA" address="0x00009888" value="0x21800000" />
+        <register type="NOA" address="0x00009888" value="0x31800000" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x10800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+        <register type="OA" address="0x00002770" value="0x008000E1" />
+        <register type="OA" address="0x00002774" value="0x001FFFE0" />
+    </register_config>
+  </set>
+
+</metrics>
diff --git a/lib/i915/perf-configs/oa-bxt.xml b/lib/i915/perf-configs/oa-bxt.xml
new file mode 100644
index 00000000..5bcbc8e7
--- /dev/null
+++ b/lib/i915/perf-configs/oa-bxt.xml
@@ -0,0 +1,9595 @@
+<?xml version="1.0"?>
+<metrics version="1581935519" merge_md5="">
+  <set name="Render Metrics Basic Gen9"
+       mdapi_supported_apis="VK OGL OCL IO BB"
+       underscore_name="render_basic"
+       hw_config_guid="22b9519a-e9ba-4c41-8b54-f4f8ca14fa0a"
+       chipset="BXT"
+       symbol_name="RenderBasic"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Misses"
+             description="The total number of L3 misses."
+             data_type="uint64"
+             equation="C 4 READ"
+             underscore_name="l3_misses"
+             units="messages"
+             symbol_name="L3Misses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/TAG"
+             />
+    <counter name="GTI L3 Throughput"
+             description="The total number of GPU memory bytes transferred between L3 caches and GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="$L3Misses 64 UMUL"
+             underscore_name="gti_l3_throughput"
+             units="bytes"
+             symbol_name="GtiL3Throughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Cache Misses"
+             description="The total number of sampler cache misses in all LODs in all sampler units."
+             data_type="uint64"
+             equation="B 4 READ 8 UMUL"
+             underscore_name="sampler_l1_misses"
+             units="messages"
+             symbol_name="SamplerL1Misses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler 1 Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which Sampler 1 has been slowing down the pipe when processing EU requests."
+             data_type="float"
+             high_watermark="15"
+             equation="B 3 READ 100 UMUL $GpuCoreClocks FDIV"
+             max_equation="100"
+             underscore_name="sampler1_bottleneck"
+             units="percent"
+             symbol_name="Sampler1Bottleneck"
+             availability="$SubsliceMask 0x12 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="L3 Sampler Throughput"
+             description="The total number of GPU memory bytes transferred between samplers and L3 caches."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="$SamplerL1Misses 64 UMUL"
+             underscore_name="l3_sampler_throughput"
+             units="bytes"
+             symbol_name="L3SamplerThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Sampler"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on the both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Sampler 0 Busy"
+             description="The percentage of time in which Sampler 0 has been processing EU requests."
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler0_busy"
+             units="percent"
+             symbol_name="Sampler0Busy"
+             availability="$SubsliceMask 0x09 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_group="Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Sampler 1 Busy"
+             description="The percentage of time in which Sampler 1 has been processing EU requests."
+             data_type="float"
+             max_equation="100"
+             equation="B 1 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler1_busy"
+             units="percent"
+             symbol_name="Sampler1Busy"
+             availability="$SubsliceMask 0x12 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_group="Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Samplers Busy"
+             description="The percentage of time in which samplers have been processing EU requests."
+             data_type="float"
+             max_equation="100"
+             equation="$Sampler0Busy $Sampler1Busy FMAX"
+             underscore_name="samplers_busy"
+             units="percent"
+             symbol_name="SamplersBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="Sampler"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="GTI Fixed Pipe Throughput"
+             description="The total number of GPU memory bytes transferred between 3D Pipeline (Command Dispatch, Input Assembly and Stream Output) and GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL"
+             equation="B 6 READ B 7 READ UADD 64 UMUL"
+             underscore_name="gti_vf_throughput"
+             units="bytes"
+             symbol_name="GtiVfThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="GTI/3D Pipe"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler 0 Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which Sampler 0 has been slowing down the pipe when processing EU requests."
+             data_type="float"
+             high_watermark="15"
+             equation="B 2 READ 100 UMUL $GpuCoreClocks FDIV"
+             max_equation="100"
+             underscore_name="sampler0_bottleneck"
+             units="percent"
+             symbol_name="Sampler0Bottleneck"
+             availability="$SubsliceMask 0x09 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="L3 Lookup Accesses w/o IC"
+             description="The total number of L3 cache lookup accesses w/o IC."
+             data_type="uint64"
+             equation="$SamplerL1Misses $ShaderMemoryAccesses UADD"
+             underscore_name="l3_lookups"
+             units="messages"
+             symbol_name="L3Lookups"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/TAG"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GTI Read Throughput"
+             description="The total number of GPU memory bytes read from GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL"
+             equation="C 6 READ 64 UMUL"
+             underscore_name="gti_read_throughput"
+             units="bytes"
+             symbol_name="GtiReadThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GTI Depth Throughput"
+             description="The total number of GPU memory bytes transferred between depth caches and GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="C 0 READ C 1 READ UADD 64 UMUL"
+             underscore_name="gti_depth_throughput"
+             units="bytes"
+             symbol_name="GtiDepthThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="GTI/Depth Cache"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Samplers Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which samplers have been slowing down the pipe when processing EU requests."
+             data_type="float"
+             high_watermark="15"
+             equation="$Sampler0Bottleneck $Sampler1Bottleneck FMAX"
+             max_equation="100"
+             underscore_name="sampler_bottleneck"
+             units="percent"
+             symbol_name="SamplerBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Indicate System Frame Batch Draw"
+             mdapi_group="Sampler"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="GTI HDC TLB Lookup Throughput"
+             description="The total number of GPU memory bytes transferred between GTI and HDC, when HDC is doing TLB lookups."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="C 5 READ 64 UMUL"
+             underscore_name="gti_hdc_lookups_throughput"
+             units="bytes"
+             symbol_name="GtiHdcLookupsThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GTI RCC Throughput"
+             description="The total number of GPU memory bytes transferred between render color caches and GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="C 2 READ C 3 READ UADD 64 UMUL"
+             underscore_name="gti_rcc_throughput"
+             units="bytes"
+             symbol_name="GtiRccThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="GTI/Color Cache"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="GTI Write Throughput"
+             description="The total number of GPU memory bytes written to GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 32 UMUL"
+             equation="C 7 READ 64 UMUL"
+             underscore_name="gti_write_throughput"
+             units="bytes"
+             symbol_name="GtiWriteThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA"
+                     availability="$SkuRevisionId 0x03 UGTE"
+                     priority="0"
+                     >
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x166C00F0" />
+        <register type="NOA" address="0x00009888" value="0x12120280" />
+        <register type="NOA" address="0x00009888" value="0x12320280" />
+        <register type="NOA" address="0x00009888" value="0x11930317" />
+        <register type="NOA" address="0x00009888" value="0x159303DF" />
+        <register type="NOA" address="0x00009888" value="0x3F900C00" />
+        <register type="NOA" address="0x00009888" value="0x419000A0" />
+        <register type="NOA" address="0x00009888" value="0x002D1000" />
+        <register type="NOA" address="0x00009888" value="0x062D4000" />
+        <register type="NOA" address="0x00009888" value="0x082D5000" />
+        <register type="NOA" address="0x00009888" value="0x0A2D1000" />
+        <register type="NOA" address="0x00009888" value="0x0C2E0800" />
+        <register type="NOA" address="0x00009888" value="0x0E2E5900" />
+        <register type="NOA" address="0x00009888" value="0x0A4C8000" />
+        <register type="NOA" address="0x00009888" value="0x0C4C8000" />
+        <register type="NOA" address="0x00009888" value="0x0E4C4000" />
+        <register type="NOA" address="0x00009888" value="0x064E8000" />
+        <register type="NOA" address="0x00009888" value="0x084E8000" />
+        <register type="NOA" address="0x00009888" value="0x0A4E2000" />
+        <register type="NOA" address="0x00009888" value="0x1C4F0010" />
+        <register type="NOA" address="0x00009888" value="0x0A6C0053" />
+        <register type="NOA" address="0x00009888" value="0x106C0000" />
+        <register type="NOA" address="0x00009888" value="0x1C6C0000" />
+        <register type="NOA" address="0x00009888" value="0x1A0FCC00" />
+        <register type="NOA" address="0x00009888" value="0x1C0F0002" />
+        <register type="NOA" address="0x00009888" value="0x1C2C0040" />
+        <register type="NOA" address="0x00009888" value="0x00101000" />
+        <register type="NOA" address="0x00009888" value="0x04101000" />
+        <register type="NOA" address="0x00009888" value="0x00114000" />
+        <register type="NOA" address="0x00009888" value="0x08114000" />
+        <register type="NOA" address="0x00009888" value="0x00120020" />
+        <register type="NOA" address="0x00009888" value="0x08120021" />
+        <register type="NOA" address="0x00009888" value="0x00141000" />
+        <register type="NOA" address="0x00009888" value="0x08141000" />
+        <register type="NOA" address="0x00009888" value="0x02308000" />
+        <register type="NOA" address="0x00009888" value="0x04302000" />
+        <register type="NOA" address="0x00009888" value="0x06318000" />
+        <register type="NOA" address="0x00009888" value="0x08318000" />
+        <register type="NOA" address="0x00009888" value="0x06320800" />
+        <register type="NOA" address="0x00009888" value="0x08320840" />
+        <register type="NOA" address="0x00009888" value="0x00320000" />
+        <register type="NOA" address="0x00009888" value="0x06344000" />
+        <register type="NOA" address="0x00009888" value="0x08344000" />
+        <register type="NOA" address="0x00009888" value="0x0D931831" />
+        <register type="NOA" address="0x00009888" value="0x0F939F3F" />
+        <register type="NOA" address="0x00009888" value="0x01939E80" />
+        <register type="NOA" address="0x00009888" value="0x039303BC" />
+        <register type="NOA" address="0x00009888" value="0x0593000E" />
+        <register type="NOA" address="0x00009888" value="0x1993002A" />
+        <register type="NOA" address="0x00009888" value="0x07930000" />
+        <register type="NOA" address="0x00009888" value="0x09930000" />
+        <register type="NOA" address="0x00009888" value="0x1D900177" />
+        <register type="NOA" address="0x00009888" value="0x1F900187" />
+        <register type="NOA" address="0x00009888" value="0x35900000" />
+        <register type="NOA" address="0x00009888" value="0x13904000" />
+        <register type="NOA" address="0x00009888" value="0x21904000" />
+        <register type="NOA" address="0x00009888" value="0x23904000" />
+        <register type="NOA" address="0x00009888" value="0x25904000" />
+        <register type="NOA" address="0x00009888" value="0x27904000" />
+        <register type="NOA" address="0x00009888" value="0x2B904000" />
+        <register type="NOA" address="0x00009888" value="0x2D904000" />
+        <register type="NOA" address="0x00009888" value="0x2F904000" />
+        <register type="NOA" address="0x00009888" value="0x31904000" />
+        <register type="NOA" address="0x00009888" value="0x15904000" />
+        <register type="NOA" address="0x00009888" value="0x17904000" />
+        <register type="NOA" address="0x00009888" value="0x19904000" />
+        <register type="NOA" address="0x00009888" value="0x1B904000" />
+        <register type="NOA" address="0x00009888" value="0x53901110" />
+        <register type="NOA" address="0x00009888" value="0x43900423" />
+        <register type="NOA" address="0x00009888" value="0x55900111" />
+        <register type="NOA" address="0x00009888" value="0x47900C02" />
+        <register type="NOA" address="0x00009888" value="0x57900000" />
+        <register type="NOA" address="0x00009888" value="0x49900020" />
+        <register type="NOA" address="0x00009888" value="0x59901111" />
+        <register type="NOA" address="0x00009888" value="0x4B900421" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+        <register type="NOA" address="0x00009888" value="0x4D900001" />
+        <register type="NOA" address="0x00009888" value="0x45900821" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x00800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+        <register type="OA" address="0x00002740" value="0x00000000" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E758" value="0x00015014" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+        <register type="FLEX" address="0x0000E65C" value="0x00055054" />
+    </register_config>
+  </set>
+
+  <set name="Compute Metrics Basic Gen9"
+       mdapi_supported_apis="VK OGL4 OCL IO BB"
+       underscore_name="compute_basic"
+       hw_config_guid="012d72cf-82a9-4d25-8ddf-74076fd30797"
+       chipset="BXT"
+       symbol_name="ComputeBasic"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Untyped Bytes Read"
+             description="The total number of untyped memory bytes read via Data Port."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="B 6 READ B 7 READ UADD $EuSlicesTotalCount 64 UMUL UMUL"
+             underscore_name="untyped_bytes_read"
+             units="bytes"
+             symbol_name="UntypedBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Typed Bytes Written"
+             description="The total number of typed memory bytes written via Data Port."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="B 3 READ B 4 READ UADD $EuSlicesTotalCount 64 UMUL UMUL"
+             underscore_name="typed_bytes_written"
+             units="bytes"
+             symbol_name="TypedBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="fpu0_active"
+             units="percent"
+             symbol_name="Fpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="fpu1_active"
+             units="percent"
+             symbol_name="Fpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU AVG IPC Rate"
+             description="The average rate of IPC calculated for 2 FPU pipelines."
+             data_type="float"
+             max_equation="2"
+             equation="A 9 READ  A 10 READ  A 11 READ UADD  A 9 READ USUB FDIV 1 FADD"
+             underscore_name="eu_avg_ipc_rate"
+             units="number"
+             symbol_name="EuAvgIpcRate"
+             semantic_type="ratio"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier4 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texel lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GTI Read Throughput"
+             description="The total number of GPU memory bytes read from GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="C 4 READ 64 UMUL"
+             underscore_name="gti_read_throughput"
+             units="bytes"
+             symbol_name="GtiReadThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Untyped Writes"
+             description="The total number of untyped memory bytes written via Data Port."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="C 1 READ C 2 READ UADD $EuSlicesTotalCount 64 UMUL UMUL"
+             underscore_name="untyped_bytes_written"
+             units="bytes"
+             symbol_name="UntypedBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="Typed Bytes Read"
+             description="The total number of typed memory bytes read via Data Port."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="B 0 READ B 1 READ UADD $EuSlicesTotalCount 64 UMUL UMUL"
+             underscore_name="typed_bytes_read"
+             units="bytes"
+             symbol_name="TypedBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="EU Thread Occupancy"
+             description="The percentage of time in which hardware threads occupied EUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 13 READ 8 UMUL $EuCoresTotalCount UDIV $EuThreadsCount UDIV 100 UMUL  $GpuCoreClocks FDIV"
+             underscore_name="eu_thread_occupancy"
+             units="percent"
+             symbol_name="EuThreadOccupancy"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="GTI Write Throughput"
+             description="The total number of GPU memory bytes written to GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 32 UMUL"
+             equation="C 5 READ 64 UMUL"
+             underscore_name="gti_write_throughput"
+             units="bytes"
+             symbol_name="GtiWriteThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <counter name="EU Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_send_active"
+             units="percent"
+             symbol_name="EuSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x104F00E0" />
+        <register type="NOA" address="0x00009888" value="0x124F1C00" />
+        <register type="NOA" address="0x00009888" value="0x39900340" />
+        <register type="NOA" address="0x00009888" value="0x3F900C00" />
+        <register type="NOA" address="0x00009888" value="0x41900000" />
+        <register type="NOA" address="0x00009888" value="0x002D5000" />
+        <register type="NOA" address="0x00009888" value="0x062D4000" />
+        <register type="NOA" address="0x00009888" value="0x082D4000" />
+        <register type="NOA" address="0x00009888" value="0x0A2D1000" />
+        <register type="NOA" address="0x00009888" value="0x0C2D5000" />
+        <register type="NOA" address="0x00009888" value="0x0E2D4000" />
+        <register type="NOA" address="0x00009888" value="0x0C2E1400" />
+        <register type="NOA" address="0x00009888" value="0x0E2E5100" />
+        <register type="NOA" address="0x00009888" value="0x102E0114" />
+        <register type="NOA" address="0x00009888" value="0x044CC000" />
+        <register type="NOA" address="0x00009888" value="0x0A4C8000" />
+        <register type="NOA" address="0x00009888" value="0x0C4C8000" />
+        <register type="NOA" address="0x00009888" value="0x0E4C4000" />
+        <register type="NOA" address="0x00009888" value="0x104C8000" />
+        <register type="NOA" address="0x00009888" value="0x124C8000" />
+        <register type="NOA" address="0x00009888" value="0x164C2000" />
+        <register type="NOA" address="0x00009888" value="0x004EA000" />
+        <register type="NOA" address="0x00009888" value="0x064E8000" />
+        <register type="NOA" address="0x00009888" value="0x084E8000" />
+        <register type="NOA" address="0x00009888" value="0x0A4E2000" />
+        <register type="NOA" address="0x00009888" value="0x0C4EA000" />
+        <register type="NOA" address="0x00009888" value="0x0E4E8000" />
+        <register type="NOA" address="0x00009888" value="0x004F6B42" />
+        <register type="NOA" address="0x00009888" value="0x064F6200" />
+        <register type="NOA" address="0x00009888" value="0x084F4100" />
+        <register type="NOA" address="0x00009888" value="0x0A4F0061" />
+        <register type="NOA" address="0x00009888" value="0x0C4F6C4C" />
+        <register type="NOA" address="0x00009888" value="0x0E4F4B00" />
+        <register type="NOA" address="0x00009888" value="0x1A4F0000" />
+        <register type="NOA" address="0x00009888" value="0x1C4F0000" />
+        <register type="NOA" address="0x00009888" value="0x180F5000" />
+        <register type="NOA" address="0x00009888" value="0x1A0F8800" />
+        <register type="NOA" address="0x00009888" value="0x1C0F08A2" />
+        <register type="NOA" address="0x00009888" value="0x182C4000" />
+        <register type="NOA" address="0x00009888" value="0x1C2C1451" />
+        <register type="NOA" address="0x00009888" value="0x1E2C0001" />
+        <register type="NOA" address="0x00009888" value="0x1A2C0010" />
+        <register type="NOA" address="0x00009888" value="0x01938000" />
+        <register type="NOA" address="0x00009888" value="0x0F938000" />
+        <register type="NOA" address="0x00009888" value="0x19938A28" />
+        <register type="NOA" address="0x00009888" value="0x03938000" />
+        <register type="NOA" address="0x00009888" value="0x19900177" />
+        <register type="NOA" address="0x00009888" value="0x1B900178" />
+        <register type="NOA" address="0x00009888" value="0x1D900125" />
+        <register type="NOA" address="0x00009888" value="0x1F900123" />
+        <register type="NOA" address="0x00009888" value="0x35900000" />
+        <register type="NOA" address="0x00009888" value="0x13904000" />
+        <register type="NOA" address="0x00009888" value="0x21904000" />
+        <register type="NOA" address="0x00009888" value="0x25904000" />
+        <register type="NOA" address="0x00009888" value="0x27904000" />
+        <register type="NOA" address="0x00009888" value="0x2B904000" />
+        <register type="NOA" address="0x00009888" value="0x2D904000" />
+        <register type="NOA" address="0x00009888" value="0x31904000" />
+        <register type="NOA" address="0x00009888" value="0x15904000" />
+        <register type="NOA" address="0x00009888" value="0x53901000" />
+        <register type="NOA" address="0x00009888" value="0x43900000" />
+        <register type="NOA" address="0x00009888" value="0x55900111" />
+        <register type="NOA" address="0x00009888" value="0x47900000" />
+        <register type="NOA" address="0x00009888" value="0x57900000" />
+        <register type="NOA" address="0x00009888" value="0x49900000" />
+        <register type="NOA" address="0x00009888" value="0x59900000" />
+        <register type="NOA" address="0x00009888" value="0x4B900000" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+        <register type="NOA" address="0x00009888" value="0x4D900000" />
+        <register type="NOA" address="0x00009888" value="0x45900000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x00800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+        <register type="OA" address="0x00002740" value="0x00000000" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00000003" />
+        <register type="FLEX" address="0x0000E658" value="0x00002001" />
+        <register type="FLEX" address="0x0000E758" value="0x00778008" />
+        <register type="FLEX" address="0x0000E45C" value="0x00088078" />
+        <register type="FLEX" address="0x0000E55C" value="0x00808708" />
+        <register type="FLEX" address="0x0000E65C" value="0x00A08908" />
+    </register_config>
+  </set>
+
+  <set name="Render Metrics for 3D Pipeline Profile Gen9"
+       mdapi_supported_apis="VK OGL OCL IO BB"
+       underscore_name="render_pipe_profile"
+       hw_config_guid="ce416533-e49e-4211-80af-ec513590a914"
+       chipset="BXT"
+       symbol_name="RenderPipeProfile"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Bottleneck"
+             low_watermark="10"
+             description="The percentage of time in which vertex shader pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="30"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_bottleneck"
+             units="percent"
+             symbol_name="VsBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Hi-Depth Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which early hierarchical depth test pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="15"
+             equation="C 6 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="hi_depth_bottleneck"
+             units="percent"
+             symbol_name="HiDepthBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which geometry shader pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="15"
+             equation="B 3 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gs_bottleneck"
+             units="percent"
+             symbol_name="GsBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Geometry Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="BC Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which barycentric coordinates calculation pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="15"
+             equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="bc_bottleneck"
+             units="percent"
+             symbol_name="BcBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Rasterizer/Barycentric Calc"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="HS Stall"
+             description="The percentage of time in which hull shader pipeline stage was stalled."
+             data_type="float"
+             equation="C 1 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="hs_stall"
+             units="percent"
+             symbol_name="HsStall"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier4 Correlate Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Hull Shader"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texel lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="VF Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which vertex fetch pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="15"
+             equation="C 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vf_bottleneck"
+             units="percent"
+             symbol_name="VfBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Input Assembler"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Strip-Fans Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which strip-fans pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="10"
+             equation="B 6 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sf_bottleneck"
+             units="percent"
+             symbol_name="SfBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Rasterizer/Strip-Fans"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SF Stall"
+             description="The percentage of time in which strip-fans pipeline stage was stalled."
+             data_type="float"
+             equation="C 5 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sf_stall"
+             units="percent"
+             symbol_name="SfStall"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Correlate Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Strip-Fans"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="HS Bottleneck"
+             low_watermark="3"
+             description="The percentage of time in which hull shader pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="9"
+             equation="B 1 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="hs_bottleneck"
+             units="percent"
+             symbol_name="HsBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Hull Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="CL Stall"
+             description="The percentage of time in which clipper pipeline stage was stalled."
+             data_type="float"
+             equation="C 4 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="cl_stall"
+             units="percent"
+             symbol_name="ClStall"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Correlate Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Clipper"
+             />
+    <counter name="SO Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which stream output pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="15"
+             equation="B 4 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="so_bottleneck"
+             units="percent"
+             symbol_name="SoBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Stream Output"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="DS Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which domain shader pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="15"
+             equation="B 2 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ds_bottleneck"
+             units="percent"
+             symbol_name="DsBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Domain Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Clipper Bottleneck"
+             low_watermark="10"
+             description="The percentage of time in which clipper pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="30"
+             equation="B 5 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="cl_bottleneck"
+             units="percent"
+             symbol_name="ClBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Clipper"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Stall"
+             description="The percentage of time in which domain shader pipeline stage was stalled."
+             data_type="float"
+             equation="C 2 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ds_stall"
+             units="percent"
+             symbol_name="DsStall"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier4 Correlate Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Domain Shader"
+             />
+    <counter name="Early Depth Bottleneck"
+             low_watermark="10"
+             description="The percentage of time in which early depth test pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="30"
+             equation="B 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="early_depth_bottleneck"
+             units="percent"
+             symbol_name="EarlyDepthBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="SO Stall"
+             description="The percentage of time in which stream-output pipeline stage was stalled."
+             data_type="float"
+             equation="C 3 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="so_stall"
+             units="percent"
+             symbol_name="SoStall"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Correlate Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Stream Output"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x0C2E001F" />
+        <register type="NOA" address="0x00009888" value="0x0A2F0000" />
+        <register type="NOA" address="0x00009888" value="0x10186800" />
+        <register type="NOA" address="0x00009888" value="0x11810019" />
+        <register type="NOA" address="0x00009888" value="0x15810013" />
+        <register type="NOA" address="0x00009888" value="0x13820020" />
+        <register type="NOA" address="0x00009888" value="0x11830020" />
+        <register type="NOA" address="0x00009888" value="0x17840000" />
+        <register type="NOA" address="0x00009888" value="0x11860007" />
+        <register type="NOA" address="0x00009888" value="0x21860000" />
+        <register type="NOA" address="0x00009888" value="0x178703E0" />
+        <register type="NOA" address="0x00009888" value="0x0C2D8000" />
+        <register type="NOA" address="0x00009888" value="0x042D4000" />
+        <register type="NOA" address="0x00009888" value="0x062D1000" />
+        <register type="NOA" address="0x00009888" value="0x022E5400" />
+        <register type="NOA" address="0x00009888" value="0x002E0000" />
+        <register type="NOA" address="0x00009888" value="0x0E2E0080" />
+        <register type="NOA" address="0x00009888" value="0x082F0040" />
+        <register type="NOA" address="0x00009888" value="0x002F0000" />
+        <register type="NOA" address="0x00009888" value="0x06143000" />
+        <register type="NOA" address="0x00009888" value="0x06174000" />
+        <register type="NOA" address="0x00009888" value="0x06180012" />
+        <register type="NOA" address="0x00009888" value="0x00180000" />
+        <register type="NOA" address="0x00009888" value="0x0D804000" />
+        <register type="NOA" address="0x00009888" value="0x0F804000" />
+        <register type="NOA" address="0x00009888" value="0x05804000" />
+        <register type="NOA" address="0x00009888" value="0x09810200" />
+        <register type="NOA" address="0x00009888" value="0x0B810030" />
+        <register type="NOA" address="0x00009888" value="0x03810003" />
+        <register type="NOA" address="0x00009888" value="0x21819140" />
+        <register type="NOA" address="0x00009888" value="0x23819050" />
+        <register type="NOA" address="0x00009888" value="0x25810018" />
+        <register type="NOA" address="0x00009888" value="0x0B820980" />
+        <register type="NOA" address="0x00009888" value="0x03820D80" />
+        <register type="NOA" address="0x00009888" value="0x11820000" />
+        <register type="NOA" address="0x00009888" value="0x0182C000" />
+        <register type="NOA" address="0x00009888" value="0x07828000" />
+        <register type="NOA" address="0x00009888" value="0x09824000" />
+        <register type="NOA" address="0x00009888" value="0x0F828000" />
+        <register type="NOA" address="0x00009888" value="0x0D830004" />
+        <register type="NOA" address="0x00009888" value="0x0583000C" />
+        <register type="NOA" address="0x00009888" value="0x0F831000" />
+        <register type="NOA" address="0x00009888" value="0x01848072" />
+        <register type="NOA" address="0x00009888" value="0x11840000" />
+        <register type="NOA" address="0x00009888" value="0x07848000" />
+        <register type="NOA" address="0x00009888" value="0x09844000" />
+        <register type="NOA" address="0x00009888" value="0x0F848000" />
+        <register type="NOA" address="0x00009888" value="0x07860000" />
+        <register type="NOA" address="0x00009888" value="0x09860092" />
+        <register type="NOA" address="0x00009888" value="0x0F860400" />
+        <register type="NOA" address="0x00009888" value="0x01869100" />
+        <register type="NOA" address="0x00009888" value="0x0F870065" />
+        <register type="NOA" address="0x00009888" value="0x01870000" />
+        <register type="NOA" address="0x00009888" value="0x19930800" />
+        <register type="NOA" address="0x00009888" value="0x0B938000" />
+        <register type="NOA" address="0x00009888" value="0x0D938000" />
+        <register type="NOA" address="0x00009888" value="0x1B952000" />
+        <register type="NOA" address="0x00009888" value="0x1D955055" />
+        <register type="NOA" address="0x00009888" value="0x1F951455" />
+        <register type="NOA" address="0x00009888" value="0x0992A000" />
+        <register type="NOA" address="0x00009888" value="0x0F928000" />
+        <register type="NOA" address="0x00009888" value="0x1192A800" />
+        <register type="NOA" address="0x00009888" value="0x1392028A" />
+        <register type="NOA" address="0x00009888" value="0x0B92A000" />
+        <register type="NOA" address="0x00009888" value="0x0D922000" />
+        <register type="NOA" address="0x00009888" value="0x13908000" />
+        <register type="NOA" address="0x00009888" value="0x21908000" />
+        <register type="NOA" address="0x00009888" value="0x23908000" />
+        <register type="NOA" address="0x00009888" value="0x25908000" />
+        <register type="NOA" address="0x00009888" value="0x27908000" />
+        <register type="NOA" address="0x00009888" value="0x29908000" />
+        <register type="NOA" address="0x00009888" value="0x2B908000" />
+        <register type="NOA" address="0x00009888" value="0x2D904000" />
+        <register type="NOA" address="0x00009888" value="0x2F908000" />
+        <register type="NOA" address="0x00009888" value="0x31908000" />
+        <register type="NOA" address="0x00009888" value="0x15908000" />
+        <register type="NOA" address="0x00009888" value="0x17908000" />
+        <register type="NOA" address="0x00009888" value="0x19908000" />
+        <register type="NOA" address="0x00009888" value="0x1B908000" />
+        <register type="NOA" address="0x00009888" value="0x1D904000" />
+        <register type="NOA" address="0x00009888" value="0x1F904000" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+        <register type="NOA" address="0x00009888" value="0x43900C01" />
+        <register type="NOA" address="0x00009888" value="0x55900000" />
+        <register type="NOA" address="0x00009888" value="0x47900000" />
+        <register type="NOA" address="0x00009888" value="0x57900000" />
+        <register type="NOA" address="0x00009888" value="0x49900863" />
+        <register type="NOA" address="0x00009888" value="0x59900000" />
+        <register type="NOA" address="0x00009888" value="0x4B900061" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+        <register type="NOA" address="0x00009888" value="0x4D900000" />
+        <register type="NOA" address="0x00009888" value="0x45900C22" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002724" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002770" value="0x0007FFEA" />
+        <register type="OA" address="0x00002774" value="0x00007FFC" />
+        <register type="OA" address="0x00002778" value="0x0007AFFA" />
+        <register type="OA" address="0x0000277C" value="0x0000F5FD" />
+        <register type="OA" address="0x00002780" value="0x00079FFA" />
+        <register type="OA" address="0x00002784" value="0x0000F3FB" />
+        <register type="OA" address="0x00002788" value="0x0007BF7A" />
+        <register type="OA" address="0x0000278C" value="0x0000F7E7" />
+        <register type="OA" address="0x00002790" value="0x0007FEFA" />
+        <register type="OA" address="0x00002794" value="0x0000F7CF" />
+        <register type="OA" address="0x00002798" value="0x00077FFA" />
+        <register type="OA" address="0x0000279C" value="0x0000EFDF" />
+        <register type="OA" address="0x000027A0" value="0x0006FFFA" />
+        <register type="OA" address="0x000027A4" value="0x0000CFBF" />
+        <register type="OA" address="0x000027A8" value="0x0003FFFA" />
+        <register type="OA" address="0x000027AC" value="0x00005F7F" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00015014" />
+        <register type="FLEX" address="0x0000E658" value="0x00025024" />
+        <register type="FLEX" address="0x0000E758" value="0x00035034" />
+        <register type="FLEX" address="0x0000E45C" value="0x00045044" />
+        <register type="FLEX" address="0x0000E55C" value="0x00055054" />
+        <register type="FLEX" address="0x0000E65C" value="0x00065064" />
+    </register_config>
+  </set>
+
+  <set name="Memory Reads Distribution Gen9"
+       mdapi_supported_apis="VK OGL OCL IO BB"
+       underscore_name="memory_reads"
+       hw_config_guid="398e2452-18d7-42d0-b241-e4d0a9148ada"
+       chipset="BXT"
+       symbol_name="MemoryReads"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GtiL3Bank0Reads"
+             description="The total number of GTI memory reads from L3 Bank 0 (L3 Cache misses)."
+             data_type="uint64"
+             equation="C 4 READ"
+             underscore_name="gti_l3_bank0_reads"
+             units="messages"
+             symbol_name="GtiL3Bank0Reads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/L3"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="GtiRingAccesses"
+             description="The total number of all accesses from GTI to the ring."
+             data_type="uint64"
+             equation="C 3 READ 2 UMUL"
+             underscore_name="gti_ring_accesses"
+             units="messages"
+             symbol_name="GtiRingAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="GtiL3Bank3Reads"
+             description="The total number of GTI memory reads from L3 Bank 3 (L3 Cache misses)."
+             data_type="uint64"
+             equation="C 7 READ"
+             underscore_name="gti_l3_bank3_reads"
+             units="messages"
+             symbol_name="GtiL3Bank3Reads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="GTI/L3"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="GtiRsMemoryReads"
+             description="The total number of GTI memory reads from Resource Streamer."
+             data_type="uint64"
+             equation="B 2 READ"
+             underscore_name="gti_rs_memory_reads"
+             units="messages"
+             symbol_name="GtiRsMemoryReads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/3D Pipe/Resource Streamer"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GtiHizMemoryReads"
+             description="The total number of GTI memory reads from Hierarchical Depth Cache (Hi-Depth Cache misses)."
+             data_type="uint64"
+             equation="B 5 READ"
+             underscore_name="gti_hiz_memory_reads"
+             units="messages"
+             symbol_name="GtiHizMemoryReads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Depth Cache"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="GtiRccMemoryReads"
+             description="The total number of GTI memory reads from Render Color Cache (Render Color Cache misses)."
+             data_type="uint64"
+             equation="B 3 READ"
+             underscore_name="gti_rcc_memory_reads"
+             units="messages"
+             symbol_name="GtiRccMemoryReads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Color Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GtiL3Bank1Reads"
+             description="The total number of GTI memory reads from L3 Bank 1 (L3 Cache misses)."
+             data_type="uint64"
+             equation="C 5 READ"
+             underscore_name="gti_l3_bank1_reads"
+             units="messages"
+             symbol_name="GtiL3Bank1Reads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="GTI/L3"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GtiCmdStreamerMemoryReads"
+             description="The total number of GTI memory reads from Command Streamer."
+             data_type="uint64"
+             equation="B 0 READ"
+             underscore_name="gti_cmd_streamer_memory_reads"
+             units="messages"
+             symbol_name="GtiCmdStreamerMemoryReads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/3D Pipe/Command Streamer"
+             />
+    <counter name="GtiL3Bank2Reads"
+             description="The total number of GTI memory reads from L3 Bank 2 (L3 Cache misses)."
+             data_type="uint64"
+             equation="C 6 READ"
+             underscore_name="gti_l3_bank2_reads"
+             units="messages"
+             symbol_name="GtiL3Bank2Reads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="GTI/L3"
+             />
+    <counter name="GtiMemoryReads"
+             description="The total number of GTI memory reads."
+             data_type="uint64"
+             equation="C 0 READ"
+             underscore_name="gti_memory_reads"
+             units="messages"
+             symbol_name="GtiMemoryReads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="GtiRczMemoryReads"
+             description="The total number of GTI memory reads from Render Depth Cache (Render Depth Cache misses)."
+             data_type="uint64"
+             equation="B 7 READ"
+             underscore_name="gti_rcz_memory_reads"
+             units="messages"
+             symbol_name="GtiRczMemoryReads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Depth Cache"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="GtiMscMemoryReads"
+             description="The total number of GTI memory reads from Multisampling Color Cache (Multisampling Color Cache misses)."
+             data_type="uint64"
+             equation="B 4 READ"
+             underscore_name="gti_msc_memory_reads"
+             units="messages"
+             symbol_name="GtiMscMemoryReads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Color Cache"
+             />
+    <counter name="GtiVfMemoryReads"
+             description="The total number of GTI memory reads from Vertex Fetch."
+             data_type="uint64"
+             equation="B 1 READ"
+             underscore_name="gti_vf_memory_reads"
+             units="messages"
+             symbol_name="GtiVfMemoryReads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/3D Pipe/Vertex Fetch"
+             />
+    <counter name="GtiStcMemoryReads"
+             description="The total number of GTI memory reads from Stencil Cache (Stencil Cache misses)."
+             data_type="uint64"
+             equation="B 6 READ"
+             underscore_name="gti_stc_memory_reads"
+             units="messages"
+             symbol_name="GtiStcMemoryReads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Depth Cache"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GtiL3Reads"
+             description="The total number of GTI memory reads from L3 (L3 Cache misses)."
+             data_type="uint64"
+             equation="$GtiL3Bank0Reads $GtiL3Bank1Reads $GtiL3Bank2Reads $GtiL3Bank3Reads UADD UADD UADD"
+             underscore_name="gti_l3_reads"
+             units="messages"
+             symbol_name="GtiL3Reads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/L3"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x19800343" />
+        <register type="NOA" address="0x00009888" value="0x39900340" />
+        <register type="NOA" address="0x00009888" value="0x3F901000" />
+        <register type="NOA" address="0x00009888" value="0x41900003" />
+        <register type="NOA" address="0x00009888" value="0x03803180" />
+        <register type="NOA" address="0x00009888" value="0x058035E2" />
+        <register type="NOA" address="0x00009888" value="0x0780006A" />
+        <register type="NOA" address="0x00009888" value="0x11800000" />
+        <register type="NOA" address="0x00009888" value="0x2181A000" />
+        <register type="NOA" address="0x00009888" value="0x2381000A" />
+        <register type="NOA" address="0x00009888" value="0x1D950550" />
+        <register type="NOA" address="0x00009888" value="0x0B928000" />
+        <register type="NOA" address="0x00009888" value="0x0D92A000" />
+        <register type="NOA" address="0x00009888" value="0x0F922000" />
+        <register type="NOA" address="0x00009888" value="0x13900170" />
+        <register type="NOA" address="0x00009888" value="0x21900171" />
+        <register type="NOA" address="0x00009888" value="0x23900172" />
+        <register type="NOA" address="0x00009888" value="0x25900173" />
+        <register type="NOA" address="0x00009888" value="0x27900174" />
+        <register type="NOA" address="0x00009888" value="0x29900175" />
+        <register type="NOA" address="0x00009888" value="0x2B900176" />
+        <register type="NOA" address="0x00009888" value="0x2D900177" />
+        <register type="NOA" address="0x00009888" value="0x2F90017F" />
+        <register type="NOA" address="0x00009888" value="0x31900125" />
+        <register type="NOA" address="0x00009888" value="0x15900123" />
+        <register type="NOA" address="0x00009888" value="0x17900121" />
+        <register type="NOA" address="0x00009888" value="0x35900000" />
+        <register type="NOA" address="0x00009888" value="0x19908000" />
+        <register type="NOA" address="0x00009888" value="0x1B908000" />
+        <register type="NOA" address="0x00009888" value="0x1D908000" />
+        <register type="NOA" address="0x00009888" value="0x1F908000" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+        <register type="NOA" address="0x00009888" value="0x43901084" />
+        <register type="NOA" address="0x00009888" value="0x55900000" />
+        <register type="NOA" address="0x00009888" value="0x47901080" />
+        <register type="NOA" address="0x00009888" value="0x57900000" />
+        <register type="NOA" address="0x00009888" value="0x49901084" />
+        <register type="NOA" address="0x00009888" value="0x59900000" />
+        <register type="NOA" address="0x00009888" value="0x4B901084" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+        <register type="NOA" address="0x00009888" value="0x4D900004" />
+        <register type="NOA" address="0x00009888" value="0x45900000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x0000272C" value="0xFFFFFFFF" />
+        <register type="OA" address="0x00002728" value="0xFFFFFFFF" />
+        <register type="OA" address="0x00002724" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x0000271C" value="0xFFFFFFFF" />
+        <register type="OA" address="0x00002718" value="0xFFFFFFFF" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x0000274C" value="0x86543210" />
+        <register type="OA" address="0x00002748" value="0x86543210" />
+        <register type="OA" address="0x00002744" value="0x00006667" />
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x0000275C" value="0x86543210" />
+        <register type="OA" address="0x00002758" value="0x86543210" />
+        <register type="OA" address="0x00002754" value="0x00006465" />
+        <register type="OA" address="0x00002750" value="0x00000000" />
+        <register type="OA" address="0x00002770" value="0x0007F81A" />
+        <register type="OA" address="0x00002774" value="0x0000FE00" />
+        <register type="OA" address="0x00002778" value="0x0007F82A" />
+        <register type="OA" address="0x0000277C" value="0x0000FE00" />
+        <register type="OA" address="0x00002780" value="0x0007F872" />
+        <register type="OA" address="0x00002784" value="0x0000FE00" />
+        <register type="OA" address="0x00002788" value="0x0007F8BA" />
+        <register type="OA" address="0x0000278C" value="0x0000FE00" />
+        <register type="OA" address="0x00002790" value="0x0007F87A" />
+        <register type="OA" address="0x00002794" value="0x0000FE00" />
+        <register type="OA" address="0x00002798" value="0x0007F8EA" />
+        <register type="OA" address="0x0000279C" value="0x0000FE00" />
+        <register type="OA" address="0x000027A0" value="0x0007F8E2" />
+        <register type="OA" address="0x000027A4" value="0x0000FE00" />
+        <register type="OA" address="0x000027A8" value="0x0007F8F2" />
+        <register type="OA" address="0x000027AC" value="0x0000FE00" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00015014" />
+        <register type="FLEX" address="0x0000E658" value="0x00025024" />
+        <register type="FLEX" address="0x0000E758" value="0x00035034" />
+        <register type="FLEX" address="0x0000E45C" value="0x00045044" />
+        <register type="FLEX" address="0x0000E55C" value="0x00055054" />
+        <register type="FLEX" address="0x0000E65C" value="0x00065064" />
+    </register_config>
+  </set>
+
+  <set name="Memory Writes Distribution Gen9"
+       mdapi_supported_apis="VK OGL OCL IO BB"
+       underscore_name="memory_writes"
+       hw_config_guid="d324a0d6-7269-4847-a5c2-6f71ddc7fed5"
+       chipset="BXT"
+       symbol_name="MemoryWrites"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GtiMemoryWrites"
+             description="The total number of GTI memory writes."
+             data_type="uint64"
+             equation="C 0 READ"
+             underscore_name="gti_memory_writes"
+             units="messages"
+             symbol_name="GtiMemoryWrites"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="GtiRingAccesses"
+             description="The total number of all GTI accesses to the ring."
+             data_type="uint64"
+             equation="C 3 READ 2 UMUL"
+             underscore_name="gti_ring_accesses"
+             units="messages"
+             symbol_name="GtiRingAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="GtiMscMemoryWrites"
+             description="The total number of GTI memory writes from Multisampling Color Cache (Multisampling Color Cache invalidations)."
+             data_type="uint64"
+             equation="B 4 READ"
+             underscore_name="gti_msc_memory_writes"
+             units="messages"
+             symbol_name="GtiMscMemoryWrites"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Color Cache"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="GtiCmdStreamerMemoryWrites"
+             description="The total number of GTI memory writes from Command Streamer."
+             data_type="uint64"
+             equation="B 0 READ"
+             underscore_name="gti_cmd_streamer_memory_writes"
+             units="messages"
+             symbol_name="GtiCmdStreamerMemoryWrites"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/3D Pipe/Command Streamer"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GtiL3Bank0Writes"
+             description="The total number of GTI memory writes from L3 Bank 0 (L3 Bank 0 invalidations)."
+             data_type="uint64"
+             equation="C 4 READ"
+             underscore_name="gti_l3_bank0_writes"
+             units="messages"
+             symbol_name="GtiL3Bank0Writes"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/L3"
+             />
+    <counter name="GtiL3Bank1Writes"
+             description="The total number of GTI memory writes from L3 Bank 1 (L3 Bank 1 invalidations)."
+             data_type="uint64"
+             equation="C 5 READ"
+             underscore_name="gti_l3_bank1_writes"
+             units="messages"
+             symbol_name="GtiL3Bank1Writes"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/L3"
+             />
+    <counter name="GtiL3Bank2Writes"
+             description="The total number of GTI memory writes from L3 Bank 2 (L3 Bank 2 invalidations)."
+             data_type="uint64"
+             equation="C 6 READ"
+             underscore_name="gti_l3_bank2_writes"
+             units="messages"
+             symbol_name="GtiL3Bank2Writes"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/L3"
+             />
+    <counter name="GtiL3Bank3Writes"
+             description="The total number of GTI memory writes from L3 Bank 3 (L3 Bank 3 invalidations)."
+             data_type="uint64"
+             equation="C 7 READ"
+             underscore_name="gti_l3_bank3_writes"
+             units="messages"
+             symbol_name="GtiL3Bank3Writes"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/L3"
+             />
+    <counter name="GtiL3Writes"
+             description="The total number of GTI memory writes from L3 (L3 invalidations)."
+             data_type="uint64"
+             equation="$GtiL3Bank0Writes $GtiL3Bank1Writes $GtiL3Bank2Writes $GtiL3Bank3Writes UADD UADD UADD"
+             underscore_name="gti_l3_writes"
+             units="messages"
+             symbol_name="GtiL3Writes"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/L3"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texel lookups (with 2x2 accuracy) that missed the L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GtiRccMemoryWrites"
+             description="The total number of GTI memory writes from Render Color Cache (Render Color Cache invalidations)."
+             data_type="uint64"
+             equation="B 3 READ"
+             underscore_name="gti_rcc_memory_writes"
+             units="messages"
+             symbol_name="GtiRccMemoryWrites"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Color Cache"
+             />
+    <counter name="GtiSoMemoryWrites"
+             description="The total number of GTI memory writes from Stream Output."
+             data_type="uint64"
+             equation="B 2 READ"
+             underscore_name="gti_so_memory_writes"
+             units="messages"
+             symbol_name="GtiSoMemoryWrites"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/3D Pipe/Stream Output"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GtiStcMemoryWrites"
+             description="The total number of GTI memory writes from Stencil Cache."
+             data_type="uint64"
+             equation="B 6 READ"
+             underscore_name="gti_stc_memory_writes"
+             units="messages"
+             symbol_name="GtiStcMemoryWrites"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Depth Cache"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="GtiRczMemoryWrites"
+             description="The total number of GTI memory writes from Render Depth Cache."
+             data_type="uint64"
+             equation="B 7 READ"
+             underscore_name="gti_rcz_memory_writes"
+             units="messages"
+             symbol_name="GtiRczMemoryWrites"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Depth Cache"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="GtiHizMemoryWrites"
+             description="The total number of GTI memory writes from Hierarchical Depth Cache."
+             data_type="uint64"
+             equation="B 5 READ"
+             underscore_name="gti_hiz_memory_writes"
+             units="messages"
+             symbol_name="GtiHizMemoryWrites"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Depth Cache"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x19800343" />
+        <register type="NOA" address="0x00009888" value="0x39900340" />
+        <register type="NOA" address="0x00009888" value="0x3F900000" />
+        <register type="NOA" address="0x00009888" value="0x41900080" />
+        <register type="NOA" address="0x00009888" value="0x03803180" />
+        <register type="NOA" address="0x00009888" value="0x058035E2" />
+        <register type="NOA" address="0x00009888" value="0x0780006A" />
+        <register type="NOA" address="0x00009888" value="0x11800000" />
+        <register type="NOA" address="0x00009888" value="0x2181A000" />
+        <register type="NOA" address="0x00009888" value="0x2381000A" />
+        <register type="NOA" address="0x00009888" value="0x1D950550" />
+        <register type="NOA" address="0x00009888" value="0x0B928000" />
+        <register type="NOA" address="0x00009888" value="0x0D92A000" />
+        <register type="NOA" address="0x00009888" value="0x0F922000" />
+        <register type="NOA" address="0x00009888" value="0x13900180" />
+        <register type="NOA" address="0x00009888" value="0x21900181" />
+        <register type="NOA" address="0x00009888" value="0x23900182" />
+        <register type="NOA" address="0x00009888" value="0x25900183" />
+        <register type="NOA" address="0x00009888" value="0x27900184" />
+        <register type="NOA" address="0x00009888" value="0x29900185" />
+        <register type="NOA" address="0x00009888" value="0x2B900186" />
+        <register type="NOA" address="0x00009888" value="0x2D900187" />
+        <register type="NOA" address="0x00009888" value="0x2F900170" />
+        <register type="NOA" address="0x00009888" value="0x31900125" />
+        <register type="NOA" address="0x00009888" value="0x15900123" />
+        <register type="NOA" address="0x00009888" value="0x17900121" />
+        <register type="NOA" address="0x00009888" value="0x35900000" />
+        <register type="NOA" address="0x00009888" value="0x19908000" />
+        <register type="NOA" address="0x00009888" value="0x1B908000" />
+        <register type="NOA" address="0x00009888" value="0x1D908000" />
+        <register type="NOA" address="0x00009888" value="0x1F908000" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+        <register type="NOA" address="0x00009888" value="0x43901084" />
+        <register type="NOA" address="0x00009888" value="0x55900000" />
+        <register type="NOA" address="0x00009888" value="0x47901080" />
+        <register type="NOA" address="0x00009888" value="0x57900000" />
+        <register type="NOA" address="0x00009888" value="0x49901084" />
+        <register type="NOA" address="0x00009888" value="0x59900000" />
+        <register type="NOA" address="0x00009888" value="0x4B901084" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+        <register type="NOA" address="0x00009888" value="0x4D900004" />
+        <register type="NOA" address="0x00009888" value="0x45900000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x0000272C" value="0xFFFFFFFF" />
+        <register type="OA" address="0x00002728" value="0xFFFFFFFF" />
+        <register type="OA" address="0x00002724" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x0000271C" value="0xFFFFFFFF" />
+        <register type="OA" address="0x00002718" value="0xFFFFFFFF" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x0000274C" value="0x86543210" />
+        <register type="OA" address="0x00002748" value="0x86543210" />
+        <register type="OA" address="0x00002744" value="0x00006667" />
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x0000275C" value="0x86543210" />
+        <register type="OA" address="0x00002758" value="0x86543210" />
+        <register type="OA" address="0x00002754" value="0x00006465" />
+        <register type="OA" address="0x00002750" value="0x00000000" />
+        <register type="OA" address="0x00002770" value="0x0007F81A" />
+        <register type="OA" address="0x00002774" value="0x0000FE00" />
+        <register type="OA" address="0x00002778" value="0x0007F82A" />
+        <register type="OA" address="0x0000277C" value="0x0000FE00" />
+        <register type="OA" address="0x00002780" value="0x0007F822" />
+        <register type="OA" address="0x00002784" value="0x0000FE00" />
+        <register type="OA" address="0x00002788" value="0x0007F8BA" />
+        <register type="OA" address="0x0000278C" value="0x0000FE00" />
+        <register type="OA" address="0x00002790" value="0x0007F87A" />
+        <register type="OA" address="0x00002794" value="0x0000FE00" />
+        <register type="OA" address="0x00002798" value="0x0007F8EA" />
+        <register type="OA" address="0x0000279C" value="0x0000FE00" />
+        <register type="OA" address="0x000027A0" value="0x0007F8E2" />
+        <register type="OA" address="0x000027A4" value="0x0000FE00" />
+        <register type="OA" address="0x000027A8" value="0x0007F8F2" />
+        <register type="OA" address="0x000027AC" value="0x0000FE00" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00015014" />
+        <register type="FLEX" address="0x0000E658" value="0x00025024" />
+        <register type="FLEX" address="0x0000E758" value="0x00035034" />
+        <register type="FLEX" address="0x0000E45C" value="0x00045044" />
+        <register type="FLEX" address="0x0000E55C" value="0x00055054" />
+        <register type="FLEX" address="0x0000E65C" value="0x00065064" />
+    </register_config>
+  </set>
+
+  <set name="Compute Metrics Extended Gen9"
+       mdapi_supported_apis="VK OGL4 OCL IO BB"
+       underscore_name="compute_extended"
+       hw_config_guid="caf3596a-7bb1-4dec-b3b3-2a080d283b49"
+       chipset="BXT"
+       symbol_name="ComputeExtended"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="fpu0_active"
+             units="percent"
+             symbol_name="Fpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="fpu1_active"
+             units="percent"
+             symbol_name="Fpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU AVG IPC Rate"
+             description="The average rate of IPC calculated for 2 FPU pipelines."
+             data_type="float"
+             max_equation="2"
+             equation="A 9 READ  A 10 READ  A 11 READ UADD  A 9 READ USUB FDIV 1 FADD"
+             underscore_name="eu_avg_ipc_rate"
+             units="number"
+             symbol_name="EuAvgIpcRate"
+             semantic_type="ratio"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Typed Writes 0"
+             description="The subslice 0 typed writes."
+             data_type="uint64"
+             equation="C 0 READ"
+             underscore_name="typed_writes0"
+             units="messages"
+             symbol_name="TypedWrites0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="EuTypedAtomics0"
+             description="The subslice 0 EU typed atomics."
+             data_type="uint64"
+             equation="B 5 READ"
+             underscore_name="eu_typed_atomics0"
+             units="messages"
+             symbol_name="EuTypedAtomics0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="Typed Atomics 0"
+             description="The subslice 0 typed atomics."
+             data_type="uint64"
+             equation="C 4 READ"
+             underscore_name="typed_atomics0"
+             units="messages"
+             symbol_name="TypedAtomics0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="TypedAtomicsPerCacheLine"
+             description="The ratio of EU typed atomics requests to L3 cache line writes."
+             data_type="float"
+             equation="$EuTypedAtomics0 $TypedAtomics0 FDIV"
+             underscore_name="typed_atomics_per_cache_line"
+             units="eu sends to l3 cache lines"
+             symbol_name="TypedAtomicsPerCacheLine"
+             semantic_type="ratio"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="EuUntypedReads0"
+             description="The subslice 0 EU untyped reads."
+             data_type="uint64"
+             equation="B 0 READ"
+             underscore_name="eu_untyped_reads0"
+             units="messages"
+             symbol_name="EuUntypedReads0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="Untyped Writes 0"
+             description="The subslice 0 untyped writes (including SLM writes)."
+             data_type="uint64"
+             equation="C 1 READ"
+             underscore_name="untyped_writes0"
+             units="messages"
+             symbol_name="UntypedWrites0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="EuUntypedAtomics0"
+             description="The subslice 0 EU untyped atomics."
+             data_type="uint64"
+             equation="B 4 READ"
+             underscore_name="eu_untyped_atomics0"
+             units="messages"
+             symbol_name="EuUntypedAtomics0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="EuUntypedWrites0"
+             description="The subslice 0 EU untyped writes."
+             data_type="uint64"
+             equation="B 1 READ"
+             underscore_name="eu_untyped_writes0"
+             units="messages"
+             symbol_name="EuUntypedWrites0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="EuA64UntypedWrites0"
+             description="The subslice 0 EU A64 untyped writes."
+             data_type="uint64"
+             equation="B 7 READ"
+             underscore_name="eu_a64_untyped_writes0"
+             units="messages"
+             symbol_name="EuA64UntypedWrites0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="UntypedWritesPerCacheLine"
+             description="The ratio of EU untyped write requests to L3 cache line writes."
+             data_type="float"
+             equation="$EuUntypedWrites0 $EuA64UntypedWrites0 UADD $UntypedWrites0 FDIV"
+             underscore_name="untyped_writes_per_cache_line"
+             units="eu sends to l3 cache lines"
+             symbol_name="UntypedWritesPerCacheLine"
+             semantic_type="ratio"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texel lookups (with 2x2 accuracy) that missed the L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EuTypedWrites0"
+             description="The subslice 0 EU Typed Writes."
+             data_type="uint64"
+             equation="B 3 READ"
+             underscore_name="eu_typed_writes0"
+             units="messages"
+             symbol_name="EuTypedWrites0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="TypedWritesPerCacheLine"
+             description="The ratio of EU typed write requests to L3 cache line writes."
+             data_type="float"
+             equation="$EuTypedWrites0 $TypedWrites0 FDIV"
+             underscore_name="typed_writes_per_cache_line"
+             units="eu sends to l3 cache lines"
+             symbol_name="TypedWritesPerCacheLine"
+             semantic_type="ratio"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="Typed Reads 0"
+             description="The subslice 0 typed reads."
+             data_type="uint64"
+             equation="C 2 READ"
+             underscore_name="typed_reads0"
+             units="messages"
+             symbol_name="TypedReads0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="Untyped Reads 0"
+             description="The subslice 0 untyped reads (including SLM reads)."
+             data_type="uint64"
+             equation="C 3 READ"
+             underscore_name="untyped_reads0"
+             units="messages"
+             symbol_name="UntypedReads0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="EuA64UntypedReads0"
+             description="The subslice 0 EU A64 Untyped Reads."
+             data_type="uint64"
+             equation="B 6 READ"
+             underscore_name="eu_a64_untyped_reads0"
+             units="messages"
+             symbol_name="EuA64UntypedReads0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="EU Thread Occupancy"
+             description="The percentage of time in which hardware threads occupied EUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 13 READ 8 UMUL $EuCoresTotalCount UDIV $EuThreadsCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_thread_occupancy"
+             units="percent"
+             symbol_name="EuThreadOccupancy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EuTypedReads0"
+             description="The subslice 0 EU Typed Reads."
+             data_type="uint64"
+             equation="B 2 READ"
+             underscore_name="eu_typed_reads0"
+             units="messages"
+             symbol_name="EuTypedReads0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="UntypedReadsPerCacheLine"
+             description="The ratio of EU untyped read requests to L3 cache line reads."
+             data_type="float"
+             equation="$EuUntypedReads0 $EuA64UntypedReads0 UADD $UntypedReads0 FDIV"
+             underscore_name="untyped_reads_per_cache_line"
+             units="eu sends to l3 cache lines"
+             symbol_name="UntypedReadsPerCacheLine"
+             semantic_type="ratio"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="TypedReadsPerCacheLine"
+             description="The ratio of EU typed read requests to L3 cache line reads."
+             data_type="float"
+             equation="$EuTypedReads0 $TypedReads0 FDIV"
+             underscore_name="typed_reads_per_cache_line"
+             units="eu sends to l3 cache lines"
+             symbol_name="TypedReadsPerCacheLine"
+             semantic_type="ratio"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <counter name="EU Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_send_active"
+             units="percent"
+             symbol_name="EuSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x104F00E0" />
+        <register type="NOA" address="0x00009888" value="0x141C0160" />
+        <register type="NOA" address="0x00009888" value="0x161C0015" />
+        <register type="NOA" address="0x00009888" value="0x181C0120" />
+        <register type="NOA" address="0x00009888" value="0x002D5000" />
+        <register type="NOA" address="0x00009888" value="0x062D4000" />
+        <register type="NOA" address="0x00009888" value="0x082D5000" />
+        <register type="NOA" address="0x00009888" value="0x0A2D5000" />
+        <register type="NOA" address="0x00009888" value="0x0C2D5000" />
+        <register type="NOA" address="0x00009888" value="0x0E2D5000" />
+        <register type="NOA" address="0x00009888" value="0x022D5000" />
+        <register type="NOA" address="0x00009888" value="0x042D5000" />
+        <register type="NOA" address="0x00009888" value="0x0C2E5400" />
+        <register type="NOA" address="0x00009888" value="0x0E2E5515" />
+        <register type="NOA" address="0x00009888" value="0x102E0155" />
+        <register type="NOA" address="0x00009888" value="0x044CC000" />
+        <register type="NOA" address="0x00009888" value="0x0A4C8000" />
+        <register type="NOA" address="0x00009888" value="0x0C4CC000" />
+        <register type="NOA" address="0x00009888" value="0x0E4CC000" />
+        <register type="NOA" address="0x00009888" value="0x104C8000" />
+        <register type="NOA" address="0x00009888" value="0x124C8000" />
+        <register type="NOA" address="0x00009888" value="0x144C8000" />
+        <register type="NOA" address="0x00009888" value="0x164C2000" />
+        <register type="NOA" address="0x00009888" value="0x064CC000" />
+        <register type="NOA" address="0x00009888" value="0x084CC000" />
+        <register type="NOA" address="0x00009888" value="0x004EA000" />
+        <register type="NOA" address="0x00009888" value="0x064E8000" />
+        <register type="NOA" address="0x00009888" value="0x084EA000" />
+        <register type="NOA" address="0x00009888" value="0x0A4EA000" />
+        <register type="NOA" address="0x00009888" value="0x0C4EA000" />
+        <register type="NOA" address="0x00009888" value="0x0E4EA000" />
+        <register type="NOA" address="0x00009888" value="0x024EA000" />
+        <register type="NOA" address="0x00009888" value="0x044EA000" />
+        <register type="NOA" address="0x00009888" value="0x0E4F4B41" />
+        <register type="NOA" address="0x00009888" value="0x004F4200" />
+        <register type="NOA" address="0x00009888" value="0x024F404C" />
+        <register type="NOA" address="0x00009888" value="0x1C4F0000" />
+        <register type="NOA" address="0x00009888" value="0x1A4F0000" />
+        <register type="NOA" address="0x00009888" value="0x001B4000" />
+        <register type="NOA" address="0x00009888" value="0x061B8000" />
+        <register type="NOA" address="0x00009888" value="0x081BC000" />
+        <register type="NOA" address="0x00009888" value="0x0A1BC000" />
+        <register type="NOA" address="0x00009888" value="0x0C1BC000" />
+        <register type="NOA" address="0x00009888" value="0x041BC000" />
+        <register type="NOA" address="0x00009888" value="0x001C0031" />
+        <register type="NOA" address="0x00009888" value="0x061C1900" />
+        <register type="NOA" address="0x00009888" value="0x081C1A33" />
+        <register type="NOA" address="0x00009888" value="0x0A1C1B35" />
+        <register type="NOA" address="0x00009888" value="0x0C1C3337" />
+        <register type="NOA" address="0x00009888" value="0x041C31C7" />
+        <register type="NOA" address="0x00009888" value="0x180F5000" />
+        <register type="NOA" address="0x00009888" value="0x1A0FA8AA" />
+        <register type="NOA" address="0x00009888" value="0x1C0F0AAA" />
+        <register type="NOA" address="0x00009888" value="0x182C8000" />
+        <register type="NOA" address="0x00009888" value="0x1C2C6AAA" />
+        <register type="NOA" address="0x00009888" value="0x1E2C0001" />
+        <register type="NOA" address="0x00009888" value="0x1A2C2950" />
+        <register type="NOA" address="0x00009888" value="0x01938000" />
+        <register type="NOA" address="0x00009888" value="0x0F938000" />
+        <register type="NOA" address="0x00009888" value="0x1993AAAA" />
+        <register type="NOA" address="0x00009888" value="0x03938000" />
+        <register type="NOA" address="0x00009888" value="0x05938000" />
+        <register type="NOA" address="0x00009888" value="0x07938000" />
+        <register type="NOA" address="0x00009888" value="0x09938000" />
+        <register type="NOA" address="0x00009888" value="0x0B938000" />
+        <register type="NOA" address="0x00009888" value="0x13904000" />
+        <register type="NOA" address="0x00009888" value="0x21904000" />
+        <register type="NOA" address="0x00009888" value="0x23904000" />
+        <register type="NOA" address="0x00009888" value="0x25904000" />
+        <register type="NOA" address="0x00009888" value="0x27904000" />
+        <register type="NOA" address="0x00009888" value="0x29904000" />
+        <register type="NOA" address="0x00009888" value="0x2B904000" />
+        <register type="NOA" address="0x00009888" value="0x2D904000" />
+        <register type="NOA" address="0x00009888" value="0x2F904000" />
+        <register type="NOA" address="0x00009888" value="0x31904000" />
+        <register type="NOA" address="0x00009888" value="0x15904000" />
+        <register type="NOA" address="0x00009888" value="0x17904000" />
+        <register type="NOA" address="0x00009888" value="0x19904000" />
+        <register type="NOA" address="0x00009888" value="0x1B904000" />
+        <register type="NOA" address="0x00009888" value="0x1D904000" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+        <register type="NOA" address="0x00009888" value="0x43900420" />
+        <register type="NOA" address="0x00009888" value="0x55900000" />
+        <register type="NOA" address="0x00009888" value="0x47900000" />
+        <register type="NOA" address="0x00009888" value="0x57900000" />
+        <register type="NOA" address="0x00009888" value="0x49900000" />
+        <register type="NOA" address="0x00009888" value="0x59900000" />
+        <register type="NOA" address="0x00009888" value="0x4B900400" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+        <register type="NOA" address="0x00009888" value="0x4D900001" />
+        <register type="NOA" address="0x00009888" value="0x45900001" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002724" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002770" value="0x0007FC2A" />
+        <register type="OA" address="0x00002774" value="0x0000BF00" />
+        <register type="OA" address="0x00002778" value="0x0007FC6A" />
+        <register type="OA" address="0x0000277C" value="0x0000BF00" />
+        <register type="OA" address="0x00002780" value="0x0007FC92" />
+        <register type="OA" address="0x00002784" value="0x0000BF00" />
+        <register type="OA" address="0x00002788" value="0x0007FCA2" />
+        <register type="OA" address="0x0000278C" value="0x0000BF00" />
+        <register type="OA" address="0x00002790" value="0x0007FC32" />
+        <register type="OA" address="0x00002794" value="0x0000BF00" />
+        <register type="OA" address="0x00002798" value="0x0007FC9A" />
+        <register type="OA" address="0x0000279C" value="0x0000BF00" />
+        <register type="OA" address="0x000027A0" value="0x0007FE6A" />
+        <register type="OA" address="0x000027A4" value="0x0000BF00" />
+        <register type="OA" address="0x000027A8" value="0x0007FE7A" />
+        <register type="OA" address="0x000027AC" value="0x0000BF00" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00000003" />
+        <register type="FLEX" address="0x0000E658" value="0x00002001" />
+        <register type="FLEX" address="0x0000E758" value="0x00778008" />
+        <register type="FLEX" address="0x0000E45C" value="0x00088078" />
+        <register type="FLEX" address="0x0000E55C" value="0x00808708" />
+        <register type="FLEX" address="0x0000E65C" value="0x00A08908" />
+    </register_config>
+  </set>
+
+  <set name="Compute Metrics L3 Cache Gen9"
+       mdapi_supported_apis="VK OGL4 OCL IO BB"
+       underscore_name="compute_l3_cache"
+       hw_config_guid="49b956e2-d5b9-47e0-9d8a-cee5e8cec527"
+       chipset="BXT"
+       symbol_name="ComputeL3Cache"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Bank 03 Accesses"
+             description="The total number of accesses to L3 Bank 03."
+             data_type="uint64"
+             equation="B 3 READ 2 UMUL"
+             underscore_name="l3_bank03_accesses"
+             units="messages"
+             symbol_name="L3Bank03Accesses"
+             availability="$SliceMask 0x01 AND"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="slice"
+             mdapi_group="L3"
+             />
+    <counter name="L3 Accesses"
+             description="The total number of L3 accesses from all entities."
+             data_type="uint64"
+             equation="C 0 READ C 1 READ B 2 READ B 3 READ UADD UADD UADD 2 UMUL"
+             underscore_name="l3_accesses"
+             units="messages"
+             symbol_name="L3Accesses"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Sampler Throughput"
+             description="The total number of GPU memory bytes transferred between samplers and L3 caches."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="A 29 READ 64 UMUL"
+             underscore_name="l3_sampler_throughput"
+             units="bytes"
+             symbol_name="L3SamplerThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Sampler"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="fpu0_active"
+             units="percent"
+             symbol_name="Fpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="fpu1_active"
+             units="percent"
+             symbol_name="Fpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU AVG IPC Rate"
+             description="The average rate of IPC calculated for 2 FPU pipelines."
+             data_type="float"
+             max_equation="2"
+             equation="A 9 READ  A 10 READ  A 11 READ UADD  A 9 READ USUB FDIV 1 FADD"
+             underscore_name="eu_avg_ipc_rate"
+             units="number"
+             symbol_name="EuAvgIpcRate"
+             semantic_type="ratio"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier4 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU0 Binary Instruction"
+             description="The percentage of time in which execution units were actively processing binary instructions on FPU0."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_binary_fpu0_instruction"
+             units="percent"
+             symbol_name="EuBinaryFpu0Instruction"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes/Instructions"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="EU FPU0 Hybrid Instruction"
+             description="The percentage of time in which execution units were actively processing hybrid instructions on FPU0."
+             data_type="float"
+             max_equation="100"
+             equation="A 13 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_hybrid_fpu0_instruction"
+             units="percent"
+             symbol_name="EuHybridFpu0Instruction"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="EU Array/Pipes/Instructions"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Misses"
+             description="The total number of L3 misses."
+             data_type="uint64"
+             equation="C 4 READ C 5 READ UADD"
+             underscore_name="l3_misses"
+             units="messages"
+             symbol_name="L3Misses"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/TAG"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="L3 Bank 00 Accesses"
+             description="The total number of accesses to L3 Bank 00."
+             data_type="uint64"
+             equation="C 0 READ 2 UMUL"
+             underscore_name="l3_bank00_accesses"
+             units="messages"
+             symbol_name="L3Bank00Accesses"
+             availability="$SliceMask 0x01 AND"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="slice"
+             mdapi_group="L3"
+             />
+    <counter name="EU FPU0 Move Instruction"
+             description="The percentage of time in which execution units were actively processing move instructions on FPU0."
+             data_type="float"
+             max_equation="100"
+             equation="A 19 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_move_fpu0_instruction"
+             units="percent"
+             symbol_name="EuMoveFpu0Instruction"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes/Instructions"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU FPU1 Hybrid Instruction"
+             description="The percentage of time in which execution units were actively processing hybrid instructions on FPU1."
+             data_type="float"
+             max_equation="100"
+             equation="A 14 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_hybrid_fpu1_instruction"
+             units="percent"
+             symbol_name="EuHybridFpu1Instruction"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="EU Array/Pipes/Instructions"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texel lookups (with 2x2 accuracy) that missed the L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GTI Read Throughput"
+             description="The total number of GPU memory bytes read from GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL"
+             equation="C 6 READ 64 UMUL"
+             underscore_name="gti_read_throughput"
+             units="bytes"
+             symbol_name="GtiReadThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GTI L3 Throughput"
+             description="The total number of GPU memory bytes transferred between L3 caches and GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="C 4 READ C 5 READ UADD 64 UMUL"
+             underscore_name="gti_l3_throughput"
+             units="bytes"
+             symbol_name="GtiL3Throughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Bank 00 IC Accesses"
+             description="The total number of accesses to L3 Bank 00 from IC cache."
+             data_type="uint64"
+             equation="B 0 READ B 1 READ UADD 2 UMUL $L3Bank00Accesses UMIN"
+             underscore_name="l3_bank00_ic_accesses"
+             units="messages"
+             symbol_name="L3Bank00IcAccesses"
+             availability="$SliceMask 0x01 AND"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="slice"
+             mdapi_group="L3/IC"
+             />
+    <counter name="L3 Bank 00 IC Hits"
+             description="The total number of hits in L3 Bank 00 from IC cache."
+             data_type="uint64"
+             equation="B 1 READ 2 UMUL $L3Bank00IcAccesses UMIN"
+             underscore_name="l3_bank00_ic_hits"
+             units="messages"
+             symbol_name="L3Bank00IcHits"
+             availability="$SliceMask 0x01 AND"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="slice"
+             mdapi_group="L3/IC"
+             />
+    <counter name="Sampler Accesses"
+             description="The total number of messages sent to samplers."
+             data_type="uint64"
+             equation="A 28 READ"
+             underscore_name="sampler_accesses"
+             units="messages"
+             symbol_name="SamplerAccesses"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler"
+             />
+    <counter name="L3 Bank 01 Accesses"
+             description="The total number of accesses to L3 Bank 01."
+             data_type="uint64"
+             equation="C 1 READ 2 UMUL"
+             underscore_name="l3_bank01_accesses"
+             units="messages"
+             symbol_name="L3Bank01Accesses"
+             availability="$SliceMask 0x01 AND"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="slice"
+             mdapi_group="L3"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU0 Ternary Instruction"
+             description="The percentage of time in which execution units were actively processing ternary instructions on FPU0."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_ternary_fpu0_instruction"
+             units="percent"
+             symbol_name="EuTernaryFpu0Instruction"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes/Instructions"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU FPU1 Move Instruction"
+             description="The percentage of time in which execution units were actively processing move instructions on FPU1."
+             data_type="float"
+             max_equation="100"
+             equation="A 20 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_move_fpu1_instruction"
+             units="percent"
+             symbol_name="EuMoveFpu1Instruction"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes/Instructions"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="L3 Bank 02 Accesses"
+             description="The total number of accesses to L3 Bank 02."
+             data_type="uint64"
+             equation="B 2 READ 2 UMUL"
+             underscore_name="l3_bank02_accesses"
+             units="messages"
+             symbol_name="L3Bank02Accesses"
+             availability="$SliceMask 0x01 AND"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="slice"
+             mdapi_group="L3"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="L3 Total Throughput"
+             description="The total number of GPU memory bytes transferred via L3."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="$L3Accesses 64 UMUL"
+             underscore_name="l3_total_throughput"
+             units="bytes"
+             symbol_name="L3TotalThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GTI Write Throughput"
+             description="The total number of GPU memory bytes written to GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 32 UMUL"
+             equation="C 7 READ 64 UMUL"
+             underscore_name="gti_write_throughput"
+             units="bytes"
+             symbol_name="GtiWriteThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="EU FPU1 Binary Instruction"
+             description="The percentage of time in which execution units were actively processing binary instructions on FPU1."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_binary_fpu1_instruction"
+             units="percent"
+             symbol_name="EuBinaryFpu1Instruction"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes/Instructions"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU1 Ternary Instruction"
+             description="The percentage of time in which execution units were actively processing ternary instructions on FPU1."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_ternary_fpu1_instruction"
+             units="percent"
+             symbol_name="EuTernaryFpu1Instruction"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes/Instructions"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_send_active"
+             units="percent"
+             symbol_name="EuSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x166C03B0" />
+        <register type="NOA" address="0x00009888" value="0x1593001E" />
+        <register type="NOA" address="0x00009888" value="0x3F900C00" />
+        <register type="NOA" address="0x00009888" value="0x41900000" />
+        <register type="NOA" address="0x00009888" value="0x002D1000" />
+        <register type="NOA" address="0x00009888" value="0x062D4000" />
+        <register type="NOA" address="0x00009888" value="0x082D5000" />
+        <register type="NOA" address="0x00009888" value="0x0E2D5000" />
+        <register type="NOA" address="0x00009888" value="0x0C2E0400" />
+        <register type="NOA" address="0x00009888" value="0x0E2E1500" />
+        <register type="NOA" address="0x00009888" value="0x102E0140" />
+        <register type="NOA" address="0x00009888" value="0x044C4000" />
+        <register type="NOA" address="0x00009888" value="0x0A4C8000" />
+        <register type="NOA" address="0x00009888" value="0x0C4CC000" />
+        <register type="NOA" address="0x00009888" value="0x144C8000" />
+        <register type="NOA" address="0x00009888" value="0x164C2000" />
+        <register type="NOA" address="0x00009888" value="0x004E2000" />
+        <register type="NOA" address="0x00009888" value="0x064E8000" />
+        <register type="NOA" address="0x00009888" value="0x084EA000" />
+        <register type="NOA" address="0x00009888" value="0x0E4EA000" />
+        <register type="NOA" address="0x00009888" value="0x1A4F4001" />
+        <register type="NOA" address="0x00009888" value="0x1C4F5005" />
+        <register type="NOA" address="0x00009888" value="0x006C0051" />
+        <register type="NOA" address="0x00009888" value="0x066C5000" />
+        <register type="NOA" address="0x00009888" value="0x086C5C5D" />
+        <register type="NOA" address="0x00009888" value="0x0E6C5E5F" />
+        <register type="NOA" address="0x00009888" value="0x106C0000" />
+        <register type="NOA" address="0x00009888" value="0x146C0000" />
+        <register type="NOA" address="0x00009888" value="0x1A6C0000" />
+        <register type="NOA" address="0x00009888" value="0x1C6C0000" />
+        <register type="NOA" address="0x00009888" value="0x180F1000" />
+        <register type="NOA" address="0x00009888" value="0x1A0FA800" />
+        <register type="NOA" address="0x00009888" value="0x1C0F0A00" />
+        <register type="NOA" address="0x00009888" value="0x182C4000" />
+        <register type="NOA" address="0x00009888" value="0x1C2C4015" />
+        <register type="NOA" address="0x00009888" value="0x1E2C0001" />
+        <register type="NOA" address="0x00009888" value="0x03931980" />
+        <register type="NOA" address="0x00009888" value="0x05930032" />
+        <register type="NOA" address="0x00009888" value="0x11930000" />
+        <register type="NOA" address="0x00009888" value="0x01938000" />
+        <register type="NOA" address="0x00009888" value="0x0F938000" />
+        <register type="NOA" address="0x00009888" value="0x1993A00A" />
+        <register type="NOA" address="0x00009888" value="0x07930000" />
+        <register type="NOA" address="0x00009888" value="0x09930000" />
+        <register type="NOA" address="0x00009888" value="0x1D900177" />
+        <register type="NOA" address="0x00009888" value="0x1F900178" />
+        <register type="NOA" address="0x00009888" value="0x35900000" />
+        <register type="NOA" address="0x00009888" value="0x13904000" />
+        <register type="NOA" address="0x00009888" value="0x21904000" />
+        <register type="NOA" address="0x00009888" value="0x23904000" />
+        <register type="NOA" address="0x00009888" value="0x25904000" />
+        <register type="NOA" address="0x00009888" value="0x2F904000" />
+        <register type="NOA" address="0x00009888" value="0x31904000" />
+        <register type="NOA" address="0x00009888" value="0x19904000" />
+        <register type="NOA" address="0x00009888" value="0x1B904000" />
+        <register type="NOA" address="0x00009888" value="0x53901000" />
+        <register type="NOA" address="0x00009888" value="0x43900000" />
+        <register type="NOA" address="0x00009888" value="0x55900111" />
+        <register type="NOA" address="0x00009888" value="0x47900001" />
+        <register type="NOA" address="0x00009888" value="0x57900000" />
+        <register type="NOA" address="0x00009888" value="0x49900000" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+        <register type="NOA" address="0x00009888" value="0x59900000" />
+        <register type="NOA" address="0x00009888" value="0x4B900000" />
+        <register type="NOA" address="0x00009888" value="0x4D900000" />
+        <register type="NOA" address="0x00009888" value="0x45900400" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x30800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x30800000" />
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002770" value="0x0007FFFA" />
+        <register type="OA" address="0x00002774" value="0x0000FEFE" />
+        <register type="OA" address="0x00002778" value="0x0007FFFA" />
+        <register type="OA" address="0x0000277C" value="0x0000FEFD" />
+        <register type="OA" address="0x00002790" value="0x0007FFFA" />
+        <register type="OA" address="0x00002794" value="0x0000FBEF" />
+        <register type="OA" address="0x00002798" value="0x0007FFFA" />
+        <register type="OA" address="0x0000279C" value="0x0000FBDF" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00000003" />
+        <register type="FLEX" address="0x0000E658" value="0x00002001" />
+        <register type="FLEX" address="0x0000E758" value="0x00101100" />
+        <register type="FLEX" address="0x0000E45C" value="0x00201200" />
+        <register type="FLEX" address="0x0000E55C" value="0x00301300" />
+        <register type="FLEX" address="0x0000E65C" value="0x00401400" />
+    </register_config>
+  </set>
+
+  <set name="Metric set HDCAndSF"
+       mdapi_supported_apis="VK OGL OCL IO BB"
+       underscore_name="hdc_and_sf"
+       hw_config_guid="ad9d9bc2-ccb7-4f5d-adbb-b4e67e615efd"
+       chipset="BXT"
+       symbol_name="HDCAndSF"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SQ is full"
+             description="The percentage of time when SQ is filled above a threshold (usually 48 entries)"
+             data_type="float"
+             max_equation="100"
+             equation="PERFCNT1 READ_REG 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gt_request_queue_full"
+             units="percent"
+             symbol_name="GTRequestQueueFull"
+             availability="true $QueryMode &&"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL4 OCL"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="Polygon Data Ready"
+             description="The percentage of time in which geometry pipeline output is ready"
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="poly_data_ready"
+             units="percent"
+             symbol_name="PolyDataReady"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/3D Pipe/Strip-Fans"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texel lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="HDC stalled by L3 (s0.ss1)"
+             description="Percentage of time when HDC has messages to L3, but it's stalled due to lack of credits (s0.ss1)"
+             data_type="float"
+             max_equation="100"
+             equation="C 5 READ C 4 READ USUB 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="non_sampler_shader01_access_stalled_on_l3"
+             units="percent"
+             symbol_name="NonSamplerShader01AccessStalledOnL3"
+             availability="$SubsliceMask 0x2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="GPU/Data Port"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="HDC stalled by L3 (s0.ss0)"
+             description="Percentage of time when HDC has messages to L3, but it's stalled due to lack of credits (s0.ss0)"
+             data_type="float"
+             max_equation="100"
+             equation="C 7 READ C 6 READ USUB 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="non_sampler_shader00_access_stalled_on_l3"
+             units="percent"
+             symbol_name="NonSamplerShader00AccessStalledOnL3"
+             availability="$SubsliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="GPU/Data Port"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x000091BC" value="0xE0500000" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x104F0232" />
+        <register type="NOA" address="0x00009888" value="0x124F4640" />
+        <register type="NOA" address="0x00009888" value="0x11834400" />
+        <register type="NOA" address="0x00009888" value="0x022D4000" />
+        <register type="NOA" address="0x00009888" value="0x042D5000" />
+        <register type="NOA" address="0x00009888" value="0x062D1000" />
+        <register type="NOA" address="0x00009888" value="0x0E2E0055" />
+        <register type="NOA" address="0x00009888" value="0x064C8000" />
+        <register type="NOA" address="0x00009888" value="0x084CC000" />
+        <register type="NOA" address="0x00009888" value="0x0A4C4000" />
+        <register type="NOA" address="0x00009888" value="0x024E8000" />
+        <register type="NOA" address="0x00009888" value="0x044EA000" />
+        <register type="NOA" address="0x00009888" value="0x064E2000" />
+        <register type="NOA" address="0x00009888" value="0x024F6100" />
+        <register type="NOA" address="0x00009888" value="0x044F416B" />
+        <register type="NOA" address="0x00009888" value="0x064F004B" />
+        <register type="NOA" address="0x00009888" value="0x1A4F0000" />
+        <register type="NOA" address="0x00009888" value="0x1A0F02A8" />
+        <register type="NOA" address="0x00009888" value="0x1A2C5500" />
+        <register type="NOA" address="0x00009888" value="0x0F808000" />
+        <register type="NOA" address="0x00009888" value="0x25810020" />
+        <register type="NOA" address="0x00009888" value="0x0F8305C0" />
+        <register type="NOA" address="0x00009888" value="0x07938000" />
+        <register type="NOA" address="0x00009888" value="0x09938000" />
+        <register type="NOA" address="0x00009888" value="0x0B938000" />
+        <register type="NOA" address="0x00009888" value="0x0D938000" />
+        <register type="NOA" address="0x00009888" value="0x1F951000" />
+        <register type="NOA" address="0x00009888" value="0x13920200" />
+        <register type="NOA" address="0x00009888" value="0x31908000" />
+        <register type="NOA" address="0x00009888" value="0x19904000" />
+        <register type="NOA" address="0x00009888" value="0x1B904000" />
+        <register type="NOA" address="0x00009888" value="0x1D904000" />
+        <register type="NOA" address="0x00009888" value="0x1F904000" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x59900000" />
+        <register type="NOA" address="0x00009888" value="0x4D900003" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+        <register type="NOA" address="0x00009888" value="0x45900000" />
+        <register type="NOA" address="0x00009888" value="0x55900000" />
+        <register type="NOA" address="0x00009888" value="0x47900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002744" value="0x00800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x10800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+        <register type="OA" address="0x00002770" value="0x00000002" />
+        <register type="OA" address="0x00002774" value="0x0000FDFF" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E758" value="0x00015014" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+        <register type="FLEX" address="0x0000E65C" value="0x00055054" />
+    </register_config>
+  </set>
+
+  <set name="Metric set L3_1"
+       mdapi_supported_apis="VK OGL OCL IO BB"
+       underscore_name="l3_1"
+       hw_config_guid="bde7b434-349c-4aad-8596-eb23c0352168"
+       chipset="BXT"
+       symbol_name="L3_1"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 L3 Bank1 Active"
+             description="The percentage of time in which slice0 L3 bank1 is active"
+             data_type="float"
+             max_equation="100"
+             equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l30_bank1_active"
+             units="percent"
+             symbol_name="L30Bank1Active"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SQ is full"
+             description="The percentage of time when SQ is filled above a threshold (usually 48 entries)"
+             data_type="float"
+             max_equation="100"
+             equation="PERFCNT1 READ_REG 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gt_request_queue_full"
+             units="percent"
+             symbol_name="GTRequestQueueFull"
+             availability="true $QueryMode &&"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL4 OCL"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="Slice0 L3 Bank1 Stalled"
+             description="The percentage of time in which slice0 L3 bank1 is stalled"
+             data_type="float"
+             max_equation="100"
+             equation="B 4 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l30_bank1_stalled"
+             units="percent"
+             symbol_name="L30Bank1Stalled"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 L3 Bank0 Active"
+             description="The percentage of time in which slice0 L3 bank0 is active"
+             data_type="float"
+             max_equation="100"
+             equation="C 6 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l30_bank0_active"
+             units="percent"
+             symbol_name="L30Bank0Active"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 L3 Bank0 Stalled"
+             description="The percentage of time in which slice0 L3 bank0 is stalled"
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l30_bank0_stalled"
+             units="percent"
+             symbol_name="L30Bank0Stalled"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA"
+                     availability="$SkuRevisionId 0x03 UGTE"
+                     priority="0"
+                     >
+        <register type="NOA" address="0x000091BC" value="0xE0500000" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x12643400" />
+        <register type="NOA" address="0x00009888" value="0x12653400" />
+        <register type="NOA" address="0x00009888" value="0x106C6800" />
+        <register type="NOA" address="0x00009888" value="0x126C001E" />
+        <register type="NOA" address="0x00009888" value="0x166C0010" />
+        <register type="NOA" address="0x00009888" value="0x0C2D5000" />
+        <register type="NOA" address="0x00009888" value="0x0E2D5000" />
+        <register type="NOA" address="0x00009888" value="0x002D4000" />
+        <register type="NOA" address="0x00009888" value="0x022D5000" />
+        <register type="NOA" address="0x00009888" value="0x042D5000" />
+        <register type="NOA" address="0x00009888" value="0x062D1000" />
+        <register type="NOA" address="0x00009888" value="0x102E0154" />
+        <register type="NOA" address="0x00009888" value="0x0C2E5000" />
+        <register type="NOA" address="0x00009888" value="0x0E2E0055" />
+        <register type="NOA" address="0x00009888" value="0x104C8000" />
+        <register type="NOA" address="0x00009888" value="0x124C8000" />
+        <register type="NOA" address="0x00009888" value="0x144C8000" />
+        <register type="NOA" address="0x00009888" value="0x164C2000" />
+        <register type="NOA" address="0x00009888" value="0x044C8000" />
+        <register type="NOA" address="0x00009888" value="0x064CC000" />
+        <register type="NOA" address="0x00009888" value="0x084CC000" />
+        <register type="NOA" address="0x00009888" value="0x0A4C4000" />
+        <register type="NOA" address="0x00009888" value="0x0C4EA000" />
+        <register type="NOA" address="0x00009888" value="0x0E4EA000" />
+        <register type="NOA" address="0x00009888" value="0x004E8000" />
+        <register type="NOA" address="0x00009888" value="0x024EA000" />
+        <register type="NOA" address="0x00009888" value="0x044EA000" />
+        <register type="NOA" address="0x00009888" value="0x064E2000" />
+        <register type="NOA" address="0x00009888" value="0x1C4F5500" />
+        <register type="NOA" address="0x00009888" value="0x1A4F1554" />
+        <register type="NOA" address="0x00009888" value="0x0A640024" />
+        <register type="NOA" address="0x00009888" value="0x10640000" />
+        <register type="NOA" address="0x00009888" value="0x04640000" />
+        <register type="NOA" address="0x00009888" value="0x0C650024" />
+        <register type="NOA" address="0x00009888" value="0x10650000" />
+        <register type="NOA" address="0x00009888" value="0x06650000" />
+        <register type="NOA" address="0x00009888" value="0x0C6C5327" />
+        <register type="NOA" address="0x00009888" value="0x0E6C5425" />
+        <register type="NOA" address="0x00009888" value="0x006C2A00" />
+        <register type="NOA" address="0x00009888" value="0x026C285B" />
+        <register type="NOA" address="0x00009888" value="0x046C005C" />
+        <register type="NOA" address="0x00009888" value="0x1C6C0000" />
+        <register type="NOA" address="0x00009888" value="0x1A6C0900" />
+        <register type="NOA" address="0x00009888" value="0x1C0F0AA0" />
+        <register type="NOA" address="0x00009888" value="0x180F4000" />
+        <register type="NOA" address="0x00009888" value="0x1A0F02AA" />
+        <register type="NOA" address="0x00009888" value="0x1C2C5400" />
+        <register type="NOA" address="0x00009888" value="0x1E2C0001" />
+        <register type="NOA" address="0x00009888" value="0x1A2C5550" />
+        <register type="NOA" address="0x00009888" value="0x1993AA00" />
+        <register type="NOA" address="0x00009888" value="0x03938000" />
+        <register type="NOA" address="0x00009888" value="0x05938000" />
+        <register type="NOA" address="0x00009888" value="0x07938000" />
+        <register type="NOA" address="0x00009888" value="0x09938000" />
+        <register type="NOA" address="0x00009888" value="0x0B938000" />
+        <register type="NOA" address="0x00009888" value="0x0D938000" />
+        <register type="NOA" address="0x00009888" value="0x2B904000" />
+        <register type="NOA" address="0x00009888" value="0x2D904000" />
+        <register type="NOA" address="0x00009888" value="0x2F904000" />
+        <register type="NOA" address="0x00009888" value="0x31904000" />
+        <register type="NOA" address="0x00009888" value="0x15904000" />
+        <register type="NOA" address="0x00009888" value="0x17904000" />
+        <register type="NOA" address="0x00009888" value="0x19904000" />
+        <register type="NOA" address="0x00009888" value="0x1B904000" />
+        <register type="NOA" address="0x00009888" value="0x1D904000" />
+        <register type="NOA" address="0x00009888" value="0x1F904000" />
+        <register type="NOA" address="0x00009888" value="0x59900000" />
+        <register type="NOA" address="0x00009888" value="0x4B900421" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+        <register type="NOA" address="0x00009888" value="0x4D900001" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+        <register type="NOA" address="0x00009888" value="0x43900420" />
+        <register type="NOA" address="0x00009888" value="0x45900021" />
+        <register type="NOA" address="0x00009888" value="0x55900000" />
+        <register type="NOA" address="0x00009888" value="0x47900000" />
+    </register_config>
+    <register_config type="NOA"
+                     availability="$SkuRevisionId 0x03 ULT"
+                     priority="0"
+                     >
+        <register type="NOA" address="0x000091BC" value="0xE0500000" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x14640340" />
+        <register type="NOA" address="0x00009888" value="0x14650340" />
+        <register type="NOA" address="0x00009888" value="0x106C6800" />
+        <register type="NOA" address="0x00009888" value="0x126C001E" />
+        <register type="NOA" address="0x00009888" value="0x166C0010" />
+        <register type="NOA" address="0x00009888" value="0x0C2D5000" />
+        <register type="NOA" address="0x00009888" value="0x0E2D5000" />
+        <register type="NOA" address="0x00009888" value="0x002D4000" />
+        <register type="NOA" address="0x00009888" value="0x022D5000" />
+        <register type="NOA" address="0x00009888" value="0x042D5000" />
+        <register type="NOA" address="0x00009888" value="0x062D1000" />
+        <register type="NOA" address="0x00009888" value="0x102E0154" />
+        <register type="NOA" address="0x00009888" value="0x0C2E5000" />
+        <register type="NOA" address="0x00009888" value="0x0E2E0055" />
+        <register type="NOA" address="0x00009888" value="0x104C8000" />
+        <register type="NOA" address="0x00009888" value="0x124C8000" />
+        <register type="NOA" address="0x00009888" value="0x144C8000" />
+        <register type="NOA" address="0x00009888" value="0x164C2000" />
+        <register type="NOA" address="0x00009888" value="0x044C8000" />
+        <register type="NOA" address="0x00009888" value="0x064CC000" />
+        <register type="NOA" address="0x00009888" value="0x084CC000" />
+        <register type="NOA" address="0x00009888" value="0x0A4C4000" />
+        <register type="NOA" address="0x00009888" value="0x0C4EA000" />
+        <register type="NOA" address="0x00009888" value="0x0E4EA000" />
+        <register type="NOA" address="0x00009888" value="0x004E8000" />
+        <register type="NOA" address="0x00009888" value="0x024EA000" />
+        <register type="NOA" address="0x00009888" value="0x044EA000" />
+        <register type="NOA" address="0x00009888" value="0x064E2000" />
+        <register type="NOA" address="0x00009888" value="0x1C4F5500" />
+        <register type="NOA" address="0x00009888" value="0x1A4F1554" />
+        <register type="NOA" address="0x00009888" value="0x04642400" />
+        <register type="NOA" address="0x00009888" value="0x22640000" />
+        <register type="NOA" address="0x00009888" value="0x1A640000" />
+        <register type="NOA" address="0x00009888" value="0x06650024" />
+        <register type="NOA" address="0x00009888" value="0x22650000" />
+        <register type="NOA" address="0x00009888" value="0x1C650000" />
+        <register type="NOA" address="0x00009888" value="0x0C6C5327" />
+        <register type="NOA" address="0x00009888" value="0x0E6C5425" />
+        <register type="NOA" address="0x00009888" value="0x006C2A00" />
+        <register type="NOA" address="0x00009888" value="0x026C285B" />
+        <register type="NOA" address="0x00009888" value="0x046C005C" />
+        <register type="NOA" address="0x00009888" value="0x1C6C0000" />
+        <register type="NOA" address="0x00009888" value="0x1A6C0900" />
+        <register type="NOA" address="0x00009888" value="0x1C0F0AA0" />
+        <register type="NOA" address="0x00009888" value="0x180F4000" />
+        <register type="NOA" address="0x00009888" value="0x1A0F02AA" />
+        <register type="NOA" address="0x00009888" value="0x1C2C5400" />
+        <register type="NOA" address="0x00009888" value="0x1E2C0001" />
+        <register type="NOA" address="0x00009888" value="0x1A2C5550" />
+        <register type="NOA" address="0x00009888" value="0x1993AA00" />
+        <register type="NOA" address="0x00009888" value="0x03938000" />
+        <register type="NOA" address="0x00009888" value="0x05938000" />
+        <register type="NOA" address="0x00009888" value="0x07938000" />
+        <register type="NOA" address="0x00009888" value="0x09938000" />
+        <register type="NOA" address="0x00009888" value="0x0B938000" />
+        <register type="NOA" address="0x00009888" value="0x0D938000" />
+        <register type="NOA" address="0x00009888" value="0x2B904000" />
+        <register type="NOA" address="0x00009888" value="0x2D904000" />
+        <register type="NOA" address="0x00009888" value="0x2F904000" />
+        <register type="NOA" address="0x00009888" value="0x31904000" />
+        <register type="NOA" address="0x00009888" value="0x15904000" />
+        <register type="NOA" address="0x00009888" value="0x17904000" />
+        <register type="NOA" address="0x00009888" value="0x19904000" />
+        <register type="NOA" address="0x00009888" value="0x1B904000" />
+        <register type="NOA" address="0x00009888" value="0x1D904000" />
+        <register type="NOA" address="0x00009888" value="0x1F904000" />
+        <register type="NOA" address="0x00009888" value="0x59900000" />
+        <register type="NOA" address="0x00009888" value="0x4B900421" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+        <register type="NOA" address="0x00009888" value="0x4D900001" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+        <register type="NOA" address="0x00009888" value="0x43900420" />
+        <register type="NOA" address="0x00009888" value="0x45900021" />
+        <register type="NOA" address="0x00009888" value="0x55900000" />
+        <register type="NOA" address="0x00009888" value="0x47900000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002744" value="0x00800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0xF0800000" />
+        <register type="OA" address="0x00002770" value="0x00100070" />
+        <register type="OA" address="0x00002774" value="0x0000FFF1" />
+        <register type="OA" address="0x00002778" value="0x00014002" />
+        <register type="OA" address="0x0000277C" value="0x0000C3FF" />
+        <register type="OA" address="0x00002780" value="0x00010002" />
+        <register type="OA" address="0x00002784" value="0x0000C7FF" />
+        <register type="OA" address="0x00002788" value="0x00004002" />
+        <register type="OA" address="0x0000278C" value="0x0000D3FF" />
+        <register type="OA" address="0x00002790" value="0x00100700" />
+        <register type="OA" address="0x00002794" value="0x0000FF1F" />
+        <register type="OA" address="0x00002798" value="0x00001402" />
+        <register type="OA" address="0x0000279C" value="0x0000FC3F" />
+        <register type="OA" address="0x000027A0" value="0x00001002" />
+        <register type="OA" address="0x000027A4" value="0x0000FC7F" />
+        <register type="OA" address="0x000027A8" value="0x00000402" />
+        <register type="OA" address="0x000027AC" value="0x0000FD3F" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E758" value="0x00015014" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+        <register type="FLEX" address="0x0000E65C" value="0x00055054" />
+    </register_config>
+  </set>
+
+  <set name="Metric set RasterizerAndPixelBackend"
+       mdapi_supported_apis="VK OGL OCL IO BB"
+       underscore_name="rasterizer_and_pixel_backend"
+       hw_config_guid="f3d845e6-bfc3-4ffe-b0e5-dddc80c21f07"
+       chipset="BXT"
+       symbol_name="RasterizerAndPixelBackend"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SQ is full"
+             description="The percentage of time when SQ is filled above a threshold (usually 48 entries)"
+             data_type="float"
+             max_equation="100"
+             equation="PERFCNT1 READ_REG 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gt_request_queue_full"
+             units="percent"
+             symbol_name="GTRequestQueueFull"
+             availability="true $QueryMode &&"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL4 OCL"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on the both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Slice0 Pixel Values Ready"
+             description="The percentage of time in which slice0 pixel values are ready"
+             data_type="float"
+             max_equation="100"
+             equation="C 6 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="pixel_values0_ready"
+             units="percent"
+             symbol_name="PixelValues0Ready"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/3D Pipe"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="Slice0 Rasterizer Input Available"
+             description="The percentage of time in which slice0 rasterizer input is available"
+             data_type="float"
+             max_equation="100"
+             equation="B 1 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="rasterizer0_input_available"
+             units="percent"
+             symbol_name="Rasterizer0InputAvailable"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Rasterizer"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Slice0 Post-EarlyZ Pixel Data Ready"
+             description="The percentage of time in which slice0 post-EarlyZ pixel data is ready (after early Z tests have been applied)"
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="pixel_data0_ready"
+             units="percent"
+             symbol_name="PixelData0Ready"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Rasterizer/Early Depth Test"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 Rasterizer Output Ready"
+             description="The percentage of time in which slice0 rasterizer output is ready"
+             data_type="float"
+             max_equation="100"
+             equation="C 5 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="rasterizer0_output_ready"
+             units="percent"
+             symbol_name="Rasterizer0OutputReady"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Rasterizer"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="Slice0 PS Output Available"
+             description="The percentage of time in which slice0 PS output is available"
+             data_type="float"
+             max_equation="100"
+             equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_output0_available"
+             units="percent"
+             symbol_name="PSOutput0Available"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/3D Pipe"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x000091BC" value="0xE0500000" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x102D7800" />
+        <register type="NOA" address="0x00009888" value="0x122D79E0" />
+        <register type="NOA" address="0x00009888" value="0x0C2F0004" />
+        <register type="NOA" address="0x00009888" value="0x100E3800" />
+        <register type="NOA" address="0x00009888" value="0x180F0005" />
+        <register type="NOA" address="0x00009888" value="0x002D0940" />
+        <register type="NOA" address="0x00009888" value="0x022D802F" />
+        <register type="NOA" address="0x00009888" value="0x042D4013" />
+        <register type="NOA" address="0x00009888" value="0x062D1000" />
+        <register type="NOA" address="0x00009888" value="0x0E2E0050" />
+        <register type="NOA" address="0x00009888" value="0x022F0010" />
+        <register type="NOA" address="0x00009888" value="0x002F0000" />
+        <register type="NOA" address="0x00009888" value="0x084C8000" />
+        <register type="NOA" address="0x00009888" value="0x0A4C4000" />
+        <register type="NOA" address="0x00009888" value="0x044E8000" />
+        <register type="NOA" address="0x00009888" value="0x064E2000" />
+        <register type="NOA" address="0x00009888" value="0x040E0480" />
+        <register type="NOA" address="0x00009888" value="0x000E0000" />
+        <register type="NOA" address="0x00009888" value="0x060F0027" />
+        <register type="NOA" address="0x00009888" value="0x100F0000" />
+        <register type="NOA" address="0x00009888" value="0x1A0F0040" />
+        <register type="NOA" address="0x00009888" value="0x03938000" />
+        <register type="NOA" address="0x00009888" value="0x05938000" />
+        <register type="NOA" address="0x00009888" value="0x07938000" />
+        <register type="NOA" address="0x00009888" value="0x09938000" />
+        <register type="NOA" address="0x00009888" value="0x0B938000" />
+        <register type="NOA" address="0x00009888" value="0x0D938000" />
+        <register type="NOA" address="0x00009888" value="0x15904000" />
+        <register type="NOA" address="0x00009888" value="0x17904000" />
+        <register type="NOA" address="0x00009888" value="0x19904000" />
+        <register type="NOA" address="0x00009888" value="0x1B904000" />
+        <register type="NOA" address="0x00009888" value="0x1D904000" />
+        <register type="NOA" address="0x00009888" value="0x1F904000" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+        <register type="NOA" address="0x00009888" value="0x439014A0" />
+        <register type="NOA" address="0x00009888" value="0x459000A4" />
+        <register type="NOA" address="0x00009888" value="0x55900000" />
+        <register type="NOA" address="0x00009888" value="0x47900001" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002744" value="0x00800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x30800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+        <register type="OA" address="0x00002770" value="0x00000002" />
+        <register type="OA" address="0x00002774" value="0x0000EFFF" />
+        <register type="OA" address="0x00002778" value="0x00006000" />
+        <register type="OA" address="0x0000277C" value="0x0000F3FF" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E758" value="0x00015014" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+        <register type="FLEX" address="0x0000E65C" value="0x00055054" />
+    </register_config>
+  </set>
+
+  <set name="Metric set Sampler"
+       mdapi_supported_apis="VK OGL OCL IO BB"
+       underscore_name="sampler"
+       hw_config_guid="a53d620b-c14e-49df-bd27-e076b3fb98f3"
+       chipset="BXT"
+       symbol_name="Sampler"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 Subslice2 Input Available"
+             description="The percentage of time in which slice0 subslice2 sampler input is available"
+             data_type="float"
+             max_equation="100"
+             equation="B 1 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler02_input_available"
+             units="percent"
+             symbol_name="Sampler02InputAvailable"
+             availability="$SubsliceMask 0x4 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SQ is full"
+             description="The percentage of time when SQ is filled above a threshold (usually 48 entries)"
+             data_type="float"
+             max_equation="100"
+             equation="PERFCNT1 READ_REG 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gt_request_queue_full"
+             units="percent"
+             symbol_name="GTRequestQueueFull"
+             availability="true $QueryMode &&"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL4 OCL"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 Subslice0 Input Available"
+             description="The percentage of time in which slice0 subslice0 sampler input is available"
+             data_type="float"
+             max_equation="100"
+             equation="B 2 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler00_input_available"
+             units="percent"
+             symbol_name="Sampler00InputAvailable"
+             availability="$SubsliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on the both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="Slice0 Subslice2 Sampler Output Ready"
+             description="The percentage of time in which slice0 subslice2 sampler output is ready"
+             data_type="float"
+             max_equation="100"
+             equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler02_output_ready"
+             units="percent"
+             symbol_name="Sampler02OutputReady"
+             availability="$SubsliceMask 0x4 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Slice0 Subslice1 Input Available"
+             description="The percentage of time in which slice0 subslice1 sampler input is available"
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler01_input_available"
+             units="percent"
+             symbol_name="Sampler01InputAvailable"
+             availability="$SubsliceMask 0x2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Slice0 Subslice0 Sampler Output Ready"
+             description="The percentage of time in which slice0 subslice0 sampler output is ready"
+             data_type="float"
+             max_equation="100"
+             equation="C 6 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler00_output_ready"
+             units="percent"
+             symbol_name="Sampler00OutputReady"
+             availability="$SubsliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Slice0 Subslice1 Sampler Output Ready"
+             description="The percentage of time in which slice0 subslice1 sampler output is ready"
+             data_type="float"
+             max_equation="100"
+             equation="C 5 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler01_output_ready"
+             units="percent"
+             symbol_name="Sampler01OutputReady"
+             availability="$SubsliceMask 0x2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x000091BC" value="0xE0500000" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x121300A0" />
+        <register type="NOA" address="0x00009888" value="0x141600AB" />
+        <register type="NOA" address="0x00009888" value="0x123300A0" />
+        <register type="NOA" address="0x00009888" value="0x143600AB" />
+        <register type="NOA" address="0x00009888" value="0x125300A0" />
+        <register type="NOA" address="0x00009888" value="0x145600AB" />
+        <register type="NOA" address="0x00009888" value="0x0C2D4000" />
+        <register type="NOA" address="0x00009888" value="0x0E2D5000" />
+        <register type="NOA" address="0x00009888" value="0x002D4000" />
+        <register type="NOA" address="0x00009888" value="0x022D5000" />
+        <register type="NOA" address="0x00009888" value="0x042D5000" />
+        <register type="NOA" address="0x00009888" value="0x062D1000" />
+        <register type="NOA" address="0x00009888" value="0x102E01A0" />
+        <register type="NOA" address="0x00009888" value="0x0C2E5000" />
+        <register type="NOA" address="0x00009888" value="0x0E2E0065" />
+        <register type="NOA" address="0x00009888" value="0x164C2000" />
+        <register type="NOA" address="0x00009888" value="0x044C8000" />
+        <register type="NOA" address="0x00009888" value="0x064CC000" />
+        <register type="NOA" address="0x00009888" value="0x084C4000" />
+        <register type="NOA" address="0x00009888" value="0x0A4C4000" />
+        <register type="NOA" address="0x00009888" value="0x0E4E8000" />
+        <register type="NOA" address="0x00009888" value="0x004E8000" />
+        <register type="NOA" address="0x00009888" value="0x024EA000" />
+        <register type="NOA" address="0x00009888" value="0x044E2000" />
+        <register type="NOA" address="0x00009888" value="0x064E2000" />
+        <register type="NOA" address="0x00009888" value="0x1C0F0800" />
+        <register type="NOA" address="0x00009888" value="0x180F4000" />
+        <register type="NOA" address="0x00009888" value="0x1A0F023F" />
+        <register type="NOA" address="0x00009888" value="0x1E2C0003" />
+        <register type="NOA" address="0x00009888" value="0x1A2CC030" />
+        <register type="NOA" address="0x00009888" value="0x04132180" />
+        <register type="NOA" address="0x00009888" value="0x02130000" />
+        <register type="NOA" address="0x00009888" value="0x0C148000" />
+        <register type="NOA" address="0x00009888" value="0x0E142000" />
+        <register type="NOA" address="0x00009888" value="0x04148000" />
+        <register type="NOA" address="0x00009888" value="0x1E150140" />
+        <register type="NOA" address="0x00009888" value="0x1C150040" />
+        <register type="NOA" address="0x00009888" value="0x0C163000" />
+        <register type="NOA" address="0x00009888" value="0x0E160068" />
+        <register type="NOA" address="0x00009888" value="0x10160000" />
+        <register type="NOA" address="0x00009888" value="0x18160000" />
+        <register type="NOA" address="0x00009888" value="0x0A164000" />
+        <register type="NOA" address="0x00009888" value="0x04330043" />
+        <register type="NOA" address="0x00009888" value="0x02330000" />
+        <register type="NOA" address="0x00009888" value="0x0234A000" />
+        <register type="NOA" address="0x00009888" value="0x04342000" />
+        <register type="NOA" address="0x00009888" value="0x1C350015" />
+        <register type="NOA" address="0x00009888" value="0x02363460" />
+        <register type="NOA" address="0x00009888" value="0x10360000" />
+        <register type="NOA" address="0x00009888" value="0x04360000" />
+        <register type="NOA" address="0x00009888" value="0x06360000" />
+        <register type="NOA" address="0x00009888" value="0x08364000" />
+        <register type="NOA" address="0x00009888" value="0x06530043" />
+        <register type="NOA" address="0x00009888" value="0x02530000" />
+        <register type="NOA" address="0x00009888" value="0x0E548000" />
+        <register type="NOA" address="0x00009888" value="0x00548000" />
+        <register type="NOA" address="0x00009888" value="0x06542000" />
+        <register type="NOA" address="0x00009888" value="0x1E550400" />
+        <register type="NOA" address="0x00009888" value="0x1A552000" />
+        <register type="NOA" address="0x00009888" value="0x1C550100" />
+        <register type="NOA" address="0x00009888" value="0x0E563000" />
+        <register type="NOA" address="0x00009888" value="0x00563400" />
+        <register type="NOA" address="0x00009888" value="0x10560000" />
+        <register type="NOA" address="0x00009888" value="0x18560000" />
+        <register type="NOA" address="0x00009888" value="0x02560000" />
+        <register type="NOA" address="0x00009888" value="0x0C564000" />
+        <register type="NOA" address="0x00009888" value="0x1993A800" />
+        <register type="NOA" address="0x00009888" value="0x03938000" />
+        <register type="NOA" address="0x00009888" value="0x05938000" />
+        <register type="NOA" address="0x00009888" value="0x07938000" />
+        <register type="NOA" address="0x00009888" value="0x09938000" />
+        <register type="NOA" address="0x00009888" value="0x0B938000" />
+        <register type="NOA" address="0x00009888" value="0x0D938000" />
+        <register type="NOA" address="0x00009888" value="0x2D904000" />
+        <register type="NOA" address="0x00009888" value="0x2F904000" />
+        <register type="NOA" address="0x00009888" value="0x31904000" />
+        <register type="NOA" address="0x00009888" value="0x15904000" />
+        <register type="NOA" address="0x00009888" value="0x17904000" />
+        <register type="NOA" address="0x00009888" value="0x19904000" />
+        <register type="NOA" address="0x00009888" value="0x1B904000" />
+        <register type="NOA" address="0x00009888" value="0x1D904000" />
+        <register type="NOA" address="0x00009888" value="0x1F904000" />
+        <register type="NOA" address="0x00009888" value="0x59900000" />
+        <register type="NOA" address="0x00009888" value="0x4B9014A0" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+        <register type="NOA" address="0x00009888" value="0x4D900001" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+        <register type="NOA" address="0x00009888" value="0x43900820" />
+        <register type="NOA" address="0x00009888" value="0x45901022" />
+        <register type="NOA" address="0x00009888" value="0x55900000" />
+        <register type="NOA" address="0x00009888" value="0x47900000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002744" value="0x00800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x70800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+        <register type="OA" address="0x00002770" value="0x0000C000" />
+        <register type="OA" address="0x00002774" value="0x0000E7FF" />
+        <register type="OA" address="0x00002778" value="0x00003000" />
+        <register type="OA" address="0x0000277C" value="0x0000F9FF" />
+        <register type="OA" address="0x00002780" value="0x00000C00" />
+        <register type="OA" address="0x00002784" value="0x0000FE7F" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E758" value="0x00015014" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+        <register type="FLEX" address="0x0000E65C" value="0x00055054" />
+    </register_config>
+  </set>
+
+  <set name="Metric set TDL_1"
+       mdapi_supported_apis="VK OGL OCL IO BB"
+       underscore_name="tdl_1"
+       hw_config_guid="8a44b172-6e1d-445f-8937-c06cc487ba39"
+       chipset="BXT"
+       symbol_name="TDL_1"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SQ is full"
+             description="The percentage of time when SQ is filled above a threshold (usually 48 entries)"
+             data_type="float"
+             max_equation="100"
+             equation="PERFCNT1 READ_REG 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gt_request_queue_full"
+             units="percent"
+             symbol_name="GTRequestQueueFull"
+             availability="true $QueryMode &amp;&amp;"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL4 OCL"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on the both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="NonPS Thread Ready For Dispatch on Slice0 Subslice2"
+             description="The percentage of time in which non-PS thread is ready for dispatch on slice0 subslice2 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="B 4 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="non_ps_thread02_ready_for_dispatch"
+             units="percent"
+             symbol_name="NonPSThread02ReadyForDispatch"
+             availability="$SubsliceMask 0x4 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="NonPS Thread Ready For Dispatch on Slice0 Subslice0"
+             description="The percentage of time in which non-PS thread is ready for dispatch on slice0 subslice0 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="B 2 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="non_ps_thread00_ready_for_dispatch"
+             units="percent"
+             symbol_name="NonPSThread00ReadyForDispatch"
+             availability="$SubsliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Thread Ready For Dispatch on Slice0 Subslice0"
+             description="The percentage of time in which PS thread is ready for dispatch on slice0 subslice0 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="B 1 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_thread00_ready_for_dispatch"
+             units="percent"
+             symbol_name="PSThread00ReadyForDispatch"
+             availability="$SubsliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="PS Thread Ready For Dispatch on Slice0 Subslice1"
+             description="The percentage of time in which PS thread is ready for dispatch on slice0 subslice1 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="B 5 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_thread01_ready_for_dispatch"
+             units="percent"
+             symbol_name="PSThread01ReadyForDispatch"
+             availability="$SubsliceMask 0x2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="PS Thread Ready For Dispatch on Slice0 Subslice2"
+             description="The percentage of time in which PS thread is ready for dispatch on slice0 subslice2 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="B 3 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_thread02_ready_for_dispatch"
+             units="percent"
+             symbol_name="PSThread02ReadyForDispatch"
+             availability="$SubsliceMask 0x4 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <counter name="NonPS Thread Ready For Dispatch on Slice0 Subslice1"
+             description="The percentage of time in which non-PS thread is ready for dispatch on slice0 subslice1 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="non_ps_thread01_ready_for_dispatch"
+             units="percent"
+             symbol_name="NonPSThread01ReadyForDispatch"
+             availability="$SubsliceMask 0x2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x000091BC" value="0xE0500000" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x141A0000" />
+        <register type="NOA" address="0x00009888" value="0x143A0000" />
+        <register type="NOA" address="0x00009888" value="0x145A0000" />
+        <register type="NOA" address="0x00009888" value="0x0C2D4000" />
+        <register type="NOA" address="0x00009888" value="0x0E2D5000" />
+        <register type="NOA" address="0x00009888" value="0x002D4000" />
+        <register type="NOA" address="0x00009888" value="0x022D5000" />
+        <register type="NOA" address="0x00009888" value="0x042D5000" />
+        <register type="NOA" address="0x00009888" value="0x062D1000" />
+        <register type="NOA" address="0x00009888" value="0x102E0150" />
+        <register type="NOA" address="0x00009888" value="0x0C2E5000" />
+        <register type="NOA" address="0x00009888" value="0x0E2E006A" />
+        <register type="NOA" address="0x00009888" value="0x124C8000" />
+        <register type="NOA" address="0x00009888" value="0x144C8000" />
+        <register type="NOA" address="0x00009888" value="0x164C2000" />
+        <register type="NOA" address="0x00009888" value="0x044C8000" />
+        <register type="NOA" address="0x00009888" value="0x064C4000" />
+        <register type="NOA" address="0x00009888" value="0x0A4C4000" />
+        <register type="NOA" address="0x00009888" value="0x0C4E8000" />
+        <register type="NOA" address="0x00009888" value="0x0E4EA000" />
+        <register type="NOA" address="0x00009888" value="0x004E8000" />
+        <register type="NOA" address="0x00009888" value="0x024E2000" />
+        <register type="NOA" address="0x00009888" value="0x064E2000" />
+        <register type="NOA" address="0x00009888" value="0x1C0F0BC0" />
+        <register type="NOA" address="0x00009888" value="0x180F4000" />
+        <register type="NOA" address="0x00009888" value="0x1A0F0302" />
+        <register type="NOA" address="0x00009888" value="0x1E2C0003" />
+        <register type="NOA" address="0x00009888" value="0x1A2C00F0" />
+        <register type="NOA" address="0x00009888" value="0x021A3080" />
+        <register type="NOA" address="0x00009888" value="0x041A31E5" />
+        <register type="NOA" address="0x00009888" value="0x02148000" />
+        <register type="NOA" address="0x00009888" value="0x0414A000" />
+        <register type="NOA" address="0x00009888" value="0x1C150054" />
+        <register type="NOA" address="0x00009888" value="0x06168000" />
+        <register type="NOA" address="0x00009888" value="0x08168000" />
+        <register type="NOA" address="0x00009888" value="0x0A168000" />
+        <register type="NOA" address="0x00009888" value="0x0C3A3280" />
+        <register type="NOA" address="0x00009888" value="0x0E3A0063" />
+        <register type="NOA" address="0x00009888" value="0x063A0061" />
+        <register type="NOA" address="0x00009888" value="0x023A0000" />
+        <register type="NOA" address="0x00009888" value="0x0C348000" />
+        <register type="NOA" address="0x00009888" value="0x0E342000" />
+        <register type="NOA" address="0x00009888" value="0x06342000" />
+        <register type="NOA" address="0x00009888" value="0x1E350140" />
+        <register type="NOA" address="0x00009888" value="0x1C350100" />
+        <register type="NOA" address="0x00009888" value="0x18360028" />
+        <register type="NOA" address="0x00009888" value="0x0C368000" />
+        <register type="NOA" address="0x00009888" value="0x0E5A3080" />
+        <register type="NOA" address="0x00009888" value="0x005A3280" />
+        <register type="NOA" address="0x00009888" value="0x025A0063" />
+        <register type="NOA" address="0x00009888" value="0x0E548000" />
+        <register type="NOA" address="0x00009888" value="0x00548000" />
+        <register type="NOA" address="0x00009888" value="0x02542000" />
+        <register type="NOA" address="0x00009888" value="0x1E550400" />
+        <register type="NOA" address="0x00009888" value="0x1A552000" />
+        <register type="NOA" address="0x00009888" value="0x1C550001" />
+        <register type="NOA" address="0x00009888" value="0x18560080" />
+        <register type="NOA" address="0x00009888" value="0x02568000" />
+        <register type="NOA" address="0x00009888" value="0x04568000" />
+        <register type="NOA" address="0x00009888" value="0x1993A800" />
+        <register type="NOA" address="0x00009888" value="0x03938000" />
+        <register type="NOA" address="0x00009888" value="0x05938000" />
+        <register type="NOA" address="0x00009888" value="0x07938000" />
+        <register type="NOA" address="0x00009888" value="0x09938000" />
+        <register type="NOA" address="0x00009888" value="0x0B938000" />
+        <register type="NOA" address="0x00009888" value="0x0D938000" />
+        <register type="NOA" address="0x00009888" value="0x2D904000" />
+        <register type="NOA" address="0x00009888" value="0x2F904000" />
+        <register type="NOA" address="0x00009888" value="0x31904000" />
+        <register type="NOA" address="0x00009888" value="0x15904000" />
+        <register type="NOA" address="0x00009888" value="0x17904000" />
+        <register type="NOA" address="0x00009888" value="0x19904000" />
+        <register type="NOA" address="0x00009888" value="0x1B904000" />
+        <register type="NOA" address="0x00009888" value="0x1D904000" />
+        <register type="NOA" address="0x00009888" value="0x1F904000" />
+        <register type="NOA" address="0x00009888" value="0x59900000" />
+        <register type="NOA" address="0x00009888" value="0x4B900420" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+        <register type="NOA" address="0x00009888" value="0x4D900000" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+        <register type="NOA" address="0x00009888" value="0x43900000" />
+        <register type="NOA" address="0x00009888" value="0x45901084" />
+        <register type="NOA" address="0x00009888" value="0x55900000" />
+        <register type="NOA" address="0x00009888" value="0x47900001" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002744" value="0x00800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x30800000" />
+        <register type="OA" address="0x00002770" value="0x00000002" />
+        <register type="OA" address="0x00002774" value="0x00007FFF" />
+        <register type="OA" address="0x00002778" value="0x00000000" />
+        <register type="OA" address="0x0000277C" value="0x00009FFF" />
+        <register type="OA" address="0x00002780" value="0x00000002" />
+        <register type="OA" address="0x00002784" value="0x0000EFFF" />
+        <register type="OA" address="0x00002788" value="0x00000000" />
+        <register type="OA" address="0x0000278C" value="0x0000F3FF" />
+        <register type="OA" address="0x00002790" value="0x00000002" />
+        <register type="OA" address="0x00002794" value="0x0000FDFF" />
+        <register type="OA" address="0x00002798" value="0x00000000" />
+        <register type="OA" address="0x0000279C" value="0x0000FE7F" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E758" value="0x00015014" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+        <register type="FLEX" address="0x0000E65C" value="0x00055054" />
+    </register_config>
+  </set>
+
+  <set name="Metric set TDL_2"
+       mdapi_supported_apis="VK OGL OCL IO BB"
+       underscore_name="tdl_2"
+       hw_config_guid="9d4643f8-aa05-482e-8193-070a8ab0d117"
+       chipset="BXT"
+       symbol_name="TDL_2"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SQ is full"
+             description="The percentage of time when SQ is filled above a threshold (usually 48 entries)"
+             data_type="float"
+             max_equation="100"
+             equation="PERFCNT1 READ_REG 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gt_request_queue_full"
+             units="percent"
+             symbol_name="GTRequestQueueFull"
+             availability="true $QueryMode &&"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL4 OCL"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on the both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Thread Header Ready on Slice0 Subslice1 Port 0"
+             description="The percentage of time in which thread header is ready on slice0 subslice1 thread dispatcher port 0"
+             data_type="float"
+             max_equation="100"
+             equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header01_ready_port0"
+             units="percent"
+             symbol_name="ThreadHeader01ReadyPort0"
+             availability="$SubsliceMask 0x2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Thread Header Ready on Slice0 Subslice1 Port 1"
+             description="The percentage of time in which thread header is ready on slice0 subslice1 thread dispatcher port 1"
+             data_type="float"
+             max_equation="100"
+             equation="C 2 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header01_ready_port1"
+             units="percent"
+             symbol_name="ThreadHeader01ReadyPort1"
+             availability="$SubsliceMask 0x2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Thread Header Ready on Slice0 Subslice2 Port 1"
+             description="The percentage of time in which thread header is ready on slice0 subslice2 thread dispatcher port 1"
+             data_type="float"
+             max_equation="100"
+             equation="C 4 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header02_ready_port1"
+             units="percent"
+             symbol_name="ThreadHeader02ReadyPort1"
+             availability="$SubsliceMask 0x4 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Thread Header Ready on Slice0 Subslice2 Port 0"
+             description="The percentage of time in which thread header is ready on slice0 subslice2 thread dispatcher port 0"
+             data_type="float"
+             max_equation="100"
+             equation="C 3 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header02_ready_port0"
+             units="percent"
+             symbol_name="ThreadHeader02ReadyPort0"
+             availability="$SubsliceMask 0x4 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="Thread Header Ready on Slice0 Subslice0 Port 0"
+             description="The percentage of time in which thread header is ready on slice0 subslice0 thread dispatcher port 0"
+             data_type="float"
+             max_equation="100"
+             equation="C 5 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header00_ready_port0"
+             units="percent"
+             symbol_name="ThreadHeader00ReadyPort0"
+             availability="$SubsliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <counter name="Thread Header Ready on Slice0 Subslice0 Port 1"
+             description="The percentage of time in which thread header is ready on slice0 subslice0 thread dispatcher port 1"
+             data_type="float"
+             max_equation="100"
+             equation="C 6 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header00_ready_port1"
+             units="percent"
+             symbol_name="ThreadHeader00ReadyPort1"
+             availability="$SubsliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x000091BC" value="0xE0500000" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x141A026B" />
+        <register type="NOA" address="0x00009888" value="0x143A0173" />
+        <register type="NOA" address="0x00009888" value="0x145A026B" />
+        <register type="NOA" address="0x00009888" value="0x002D4000" />
+        <register type="NOA" address="0x00009888" value="0x022D5000" />
+        <register type="NOA" address="0x00009888" value="0x042D5000" />
+        <register type="NOA" address="0x00009888" value="0x062D1000" />
+        <register type="NOA" address="0x00009888" value="0x0C2E5000" />
+        <register type="NOA" address="0x00009888" value="0x0E2E0069" />
+        <register type="NOA" address="0x00009888" value="0x044C8000" />
+        <register type="NOA" address="0x00009888" value="0x064CC000" />
+        <register type="NOA" address="0x00009888" value="0x0A4C4000" />
+        <register type="NOA" address="0x00009888" value="0x004E8000" />
+        <register type="NOA" address="0x00009888" value="0x024EA000" />
+        <register type="NOA" address="0x00009888" value="0x064E2000" />
+        <register type="NOA" address="0x00009888" value="0x180F6000" />
+        <register type="NOA" address="0x00009888" value="0x1A0F030A" />
+        <register type="NOA" address="0x00009888" value="0x1A2C03C0" />
+        <register type="NOA" address="0x00009888" value="0x041A37E7" />
+        <register type="NOA" address="0x00009888" value="0x021A0000" />
+        <register type="NOA" address="0x00009888" value="0x0414A000" />
+        <register type="NOA" address="0x00009888" value="0x1C150050" />
+        <register type="NOA" address="0x00009888" value="0x08168000" />
+        <register type="NOA" address="0x00009888" value="0x0A168000" />
+        <register type="NOA" address="0x00009888" value="0x003A3380" />
+        <register type="NOA" address="0x00009888" value="0x063A006F" />
+        <register type="NOA" address="0x00009888" value="0x023A0000" />
+        <register type="NOA" address="0x00009888" value="0x00348000" />
+        <register type="NOA" address="0x00009888" value="0x06342000" />
+        <register type="NOA" address="0x00009888" value="0x1A352000" />
+        <register type="NOA" address="0x00009888" value="0x1C350100" />
+        <register type="NOA" address="0x00009888" value="0x02368000" />
+        <register type="NOA" address="0x00009888" value="0x0C368000" />
+        <register type="NOA" address="0x00009888" value="0x025A37E7" />
+        <register type="NOA" address="0x00009888" value="0x0254A000" />
+        <register type="NOA" address="0x00009888" value="0x1C550005" />
+        <register type="NOA" address="0x00009888" value="0x04568000" />
+        <register type="NOA" address="0x00009888" value="0x06568000" />
+        <register type="NOA" address="0x00009888" value="0x03938000" />
+        <register type="NOA" address="0x00009888" value="0x05938000" />
+        <register type="NOA" address="0x00009888" value="0x07938000" />
+        <register type="NOA" address="0x00009888" value="0x09938000" />
+        <register type="NOA" address="0x00009888" value="0x0B938000" />
+        <register type="NOA" address="0x00009888" value="0x0D938000" />
+        <register type="NOA" address="0x00009888" value="0x15904000" />
+        <register type="NOA" address="0x00009888" value="0x17904000" />
+        <register type="NOA" address="0x00009888" value="0x19904000" />
+        <register type="NOA" address="0x00009888" value="0x1B904000" />
+        <register type="NOA" address="0x00009888" value="0x1D904000" />
+        <register type="NOA" address="0x00009888" value="0x1F904000" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+        <register type="NOA" address="0x00009888" value="0x43900020" />
+        <register type="NOA" address="0x00009888" value="0x45901080" />
+        <register type="NOA" address="0x00009888" value="0x55900000" />
+        <register type="NOA" address="0x00009888" value="0x47900001" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002744" value="0x00800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x00800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E758" value="0x00015014" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+        <register type="FLEX" address="0x0000E65C" value="0x00055054" />
+    </register_config>
+  </set>
+
+  <set name="Compute Metrics Extra Gen9"
+       mdapi_supported_apis="VK OGL4 OCL IO BB"
+       underscore_name="compute_extra"
+       hw_config_guid="fa6ecf21-2cb8-4d0b-9308-6e4a7b4ca87a"
+       chipset="BXT"
+       symbol_name="ComputeExtra"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="fpu1_active"
+             units="percent"
+             symbol_name="Fpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU1 Pipe Active including Ext Math"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing including Extended Math processing"
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ  C 7 READ C 6 READ FADD C 5 READ FADD 8 FMUL FADD 100 FMUL $EuCoresTotalCount FDIV $GpuCoreClocks FDIV"
+             underscore_name="fpu1_active_adjusted"
+             units="percent"
+             symbol_name="Fpu1ActiveAdjusted"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x141A001F" />
+        <register type="NOA" address="0x00009888" value="0x143A001F" />
+        <register type="NOA" address="0x00009888" value="0x145A001F" />
+        <register type="NOA" address="0x00009888" value="0x042D5000" />
+        <register type="NOA" address="0x00009888" value="0x062D1000" />
+        <register type="NOA" address="0x00009888" value="0x0E2E0094" />
+        <register type="NOA" address="0x00009888" value="0x084CC000" />
+        <register type="NOA" address="0x00009888" value="0x044EA000" />
+        <register type="NOA" address="0x00009888" value="0x1A0F00E0" />
+        <register type="NOA" address="0x00009888" value="0x1A2C0C00" />
+        <register type="NOA" address="0x00009888" value="0x061A0063" />
+        <register type="NOA" address="0x00009888" value="0x021A0000" />
+        <register type="NOA" address="0x00009888" value="0x06142000" />
+        <register type="NOA" address="0x00009888" value="0x1C150100" />
+        <register type="NOA" address="0x00009888" value="0x0C168000" />
+        <register type="NOA" address="0x00009888" value="0x043A3180" />
+        <register type="NOA" address="0x00009888" value="0x023A0000" />
+        <register type="NOA" address="0x00009888" value="0x04348000" />
+        <register type="NOA" address="0x00009888" value="0x1C350040" />
+        <register type="NOA" address="0x00009888" value="0x0A368000" />
+        <register type="NOA" address="0x00009888" value="0x045A0063" />
+        <register type="NOA" address="0x00009888" value="0x025A0000" />
+        <register type="NOA" address="0x00009888" value="0x04542000" />
+        <register type="NOA" address="0x00009888" value="0x1C550010" />
+        <register type="NOA" address="0x00009888" value="0x08568000" />
+        <register type="NOA" address="0x00009888" value="0x09938000" />
+        <register type="NOA" address="0x00009888" value="0x0B938000" />
+        <register type="NOA" address="0x00009888" value="0x0D938000" />
+        <register type="NOA" address="0x00009888" value="0x1B904000" />
+        <register type="NOA" address="0x00009888" value="0x1D904000" />
+        <register type="NOA" address="0x00009888" value="0x1F904000" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x55900000" />
+        <register type="NOA" address="0x00009888" value="0x45900400" />
+        <register type="NOA" address="0x00009888" value="0x47900004" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002744" value="0x00800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x00800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00001000" />
+        <register type="FLEX" address="0x0000E558" value="0x00003002" />
+        <register type="FLEX" address="0x0000E658" value="0x00005004" />
+        <register type="FLEX" address="0x0000E758" value="0x00011010" />
+        <register type="FLEX" address="0x0000E45C" value="0x00050012" />
+        <register type="FLEX" address="0x0000E55C" value="0x00052051" />
+        <register type="FLEX" address="0x0000E65C" value="0x00000008" />
+    </register_config>
+  </set>
+
+  <set name="Gpu Rings Busyness"
+       mdapi_supported_apis="VK OGL OCL MEDIA IO BB"
+       underscore_name="gpu_busyness"
+       hw_config_guid="c9f5fa3a-d14f-400c-a89a-211206b00ee7"
+       chipset="BXT"
+       symbol_name="GpuBusyness"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="Vebox Ring Busy"
+             description="The percentage of time when vebox command streamer was busy."
+             data_type="float"
+             max_equation="100"
+             equation="C 5 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vebox_busy"
+             units="percent"
+             symbol_name="VeboxBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="System Frame Batch"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Render Ring Busy"
+             description="The percentage of time when render command streamer was busy."
+             data_type="float"
+             max_equation="100"
+             equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="render_busy"
+             units="percent"
+             symbol_name="RenderBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="System Frame Batch"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Vdbox0 Ring Busy"
+             description="The percentage of time when Vdbox0 command streamer was busy."
+             data_type="float"
+             max_equation="100"
+             equation="C 6 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vdbox0_busy"
+             units="percent"
+             symbol_name="Vdbox0Busy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="System Frame Batch"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Blitter Ring Busy"
+             description="The percentage of time when blitter command streamer was busy."
+             data_type="float"
+             max_equation="100"
+             equation="C 4 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="blitter_busy"
+             units="percent"
+             symbol_name="BlitterBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="System Frame Batch"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="AnyRingBusy"
+             description="The percentage of time when any command streamer was busy."
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="any_ring_busy"
+             units="percent"
+             symbol_name="AnyRingBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x13805800" />
+        <register type="NOA" address="0x00009888" value="0x05962C00" />
+        <register type="NOA" address="0x00009888" value="0x19950016" />
+        <register type="NOA" address="0x00009888" value="0x21C05800" />
+        <register type="NOA" address="0x00009888" value="0x07800035" />
+        <register type="NOA" address="0x00009888" value="0x11800000" />
+        <register type="NOA" address="0x00009888" value="0x23810008" />
+        <register type="NOA" address="0x00009888" value="0x07960025" />
+        <register type="NOA" address="0x00009888" value="0x1D960000" />
+        <register type="NOA" address="0x00009888" value="0x0F960000" />
+        <register type="NOA" address="0x00009888" value="0x0B934000" />
+        <register type="NOA" address="0x00009888" value="0x09948000" />
+        <register type="NOA" address="0x00009888" value="0x05950085" />
+        <register type="NOA" address="0x00009888" value="0x11950000" />
+        <register type="NOA" address="0x00009888" value="0x1D950400" />
+        <register type="NOA" address="0x00009888" value="0x0B924000" />
+        <register type="NOA" address="0x00009888" value="0x0D922000" />
+        <register type="NOA" address="0x00009888" value="0x0F922000" />
+        <register type="NOA" address="0x00009888" value="0x19908000" />
+        <register type="NOA" address="0x00009888" value="0x1B908000" />
+        <register type="NOA" address="0x00009888" value="0x1D904000" />
+        <register type="NOA" address="0x00009888" value="0x1F908000" />
+        <register type="NOA" address="0x00009888" value="0x0BC000A5" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+        <register type="NOA" address="0x00009888" value="0x45900442" />
+        <register type="NOA" address="0x00009888" value="0x55900000" />
+        <register type="NOA" address="0x00009888" value="0x47900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x10800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+        <register type="OA" address="0x00002770" value="0x00078000" />
+        <register type="OA" address="0x00002774" value="0x00000FFF" />
+    </register_config>
+  </set>
+
+  <set name="MDAPI testing set Gen9"
+       mdapi_supported_apis="VK OGL OCL IO BB"
+       underscore_name="test_oa"
+       hw_config_guid="5ee72f5c-092f-421e-8b70-225f7c3e9612"
+       chipset="BXT"
+       symbol_name="TestOa"
+       >
+    <counter name="TestCounter7"
+             description="HW test counter 7. Factor: 0.666"
+             data_type="uint64"
+             equation="B 7 READ"
+             underscore_name="counter7"
+             units="events"
+             symbol_name="Counter7"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="TestCounter8"
+             description="HW test counter 8. Should be equal to 1."
+             data_type="uint64"
+             equation="C 7 READ"
+             underscore_name="counter8"
+             units="events"
+             symbol_name="Counter8"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="TestCounter4"
+             description="HW test counter 4. Factor: 0.333"
+             data_type="uint64"
+             equation="B 4 READ"
+             underscore_name="counter4"
+             units="events"
+             symbol_name="Counter4"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="TestCounter5"
+             description="HW test counter 5. Factor: 0.333"
+             data_type="uint64"
+             equation="B 5 READ"
+             underscore_name="counter5"
+             units="events"
+             symbol_name="Counter5"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="TestCounter6"
+             description="HW test counter 6. Factor: 0.166"
+             data_type="uint64"
+             equation="B 6 READ"
+             underscore_name="counter6"
+             units="events"
+             symbol_name="Counter6"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="TestCounter3"
+             description="HW test counter 3. Factor: 0.5"
+             data_type="uint64"
+             equation="B 3 READ"
+             underscore_name="counter3"
+             units="events"
+             symbol_name="Counter3"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="TestCounter0"
+             description="HW test counter 0. Factor: 0.0"
+             data_type="uint64"
+             equation="B 0 READ"
+             underscore_name="counter0"
+             units="events"
+             symbol_name="Counter0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="TestCounter1"
+             description="HW test counter 1. Factor: 1.0"
+             data_type="uint64"
+             equation="B 1 READ"
+             underscore_name="counter1"
+             units="events"
+             symbol_name="Counter1"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="TestCounter2"
+             description="HW test counter 2. Factor: 1.0"
+             data_type="uint64"
+             equation="B 2 READ"
+             underscore_name="counter2"
+             units="events"
+             symbol_name="Counter2"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x19800000" />
+        <register type="NOA" address="0x00009888" value="0x07800063" />
+        <register type="NOA" address="0x00009888" value="0x11800000" />
+        <register type="NOA" address="0x00009888" value="0x23810008" />
+        <register type="NOA" address="0x00009888" value="0x1D950400" />
+        <register type="NOA" address="0x00009888" value="0x0F922000" />
+        <register type="NOA" address="0x00009888" value="0x1F908000" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x55900000" />
+        <register type="NOA" address="0x00009888" value="0x47900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002744" value="0x00800000" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002770" value="0x00000004" />
+        <register type="OA" address="0x00002774" value="0x00000000" />
+        <register type="OA" address="0x00002778" value="0x00000003" />
+        <register type="OA" address="0x0000277C" value="0x00000000" />
+        <register type="OA" address="0x00002780" value="0x00000007" />
+        <register type="OA" address="0x00002784" value="0x00000000" />
+        <register type="OA" address="0x00002788" value="0x00100002" />
+        <register type="OA" address="0x0000278C" value="0x0000FFF7" />
+        <register type="OA" address="0x00002790" value="0x00100002" />
+        <register type="OA" address="0x00002794" value="0x0000FFCF" />
+        <register type="OA" address="0x00002798" value="0x00100082" />
+        <register type="OA" address="0x0000279C" value="0x0000FFEF" />
+        <register type="OA" address="0x000027A0" value="0x001000C2" />
+        <register type="OA" address="0x000027A4" value="0x0000FFE7" />
+        <register type="OA" address="0x000027A8" value="0x00100001" />
+        <register type="OA" address="0x000027AC" value="0x0000FFE7" />
+    </register_config>
+  </set>
+
+  <set name="Metric set PMA Stall"
+       mdapi_supported_apis="VK OGL OGL4 OCL IO MEDIA"
+       underscore_name="pma__stall"
+       hw_config_guid="d49cd0d8-8c7f-4465-94fc-51e08c9050bc"
+       chipset="BXT"
+       symbol_name="PMA_Stall"
+       >
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="STC PMA stall"
+             description="Percentage of time when stencil cache line and an overlapping pixel are causing stalls"
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ B 1 READ FADD 2 FDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="stc_pma_stall"
+             units="percent"
+             symbol_name="StcPMAStall"
+             availability="$SliceMask 1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_group="GPU/Stencil Cache"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x124C3080" />
+        <register type="NOA" address="0x00009888" value="0x002D1000" />
+        <register type="NOA" address="0x00009888" value="0x062D4000" />
+        <register type="NOA" address="0x00009888" value="0x082D5000" />
+        <register type="NOA" address="0x00009888" value="0x0A2D5000" />
+        <register type="NOA" address="0x00009888" value="0x0C2E0400" />
+        <register type="NOA" address="0x00009888" value="0x0E2E5500" />
+        <register type="NOA" address="0x00009888" value="0x102E0001" />
+        <register type="NOA" address="0x00009888" value="0x004C0045" />
+        <register type="NOA" address="0x00009888" value="0x064C2300" />
+        <register type="NOA" address="0x00009888" value="0x084C26C4" />
+        <register type="NOA" address="0x00009888" value="0x0A4C264E" />
+        <register type="NOA" address="0x00009888" value="0x164C0000" />
+        <register type="NOA" address="0x00009888" value="0x044C0000" />
+        <register type="NOA" address="0x00009888" value="0x0C4C0000" />
+        <register type="NOA" address="0x00009888" value="0x0E4C0000" />
+        <register type="NOA" address="0x00009888" value="0x01938000" />
+        <register type="NOA" address="0x00009888" value="0x0F938000" />
+        <register type="NOA" address="0x00009888" value="0x199300AA" />
+        <register type="NOA" address="0x00009888" value="0x13904000" />
+        <register type="NOA" address="0x00009888" value="0x21904000" />
+        <register type="NOA" address="0x00009888" value="0x23904000" />
+        <register type="NOA" address="0x00009888" value="0x25904000" />
+        <register type="NOA" address="0x00009888" value="0x27904000" />
+        <register type="NOA" address="0x00009888" value="0x29904000" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+        <register type="NOA" address="0x00009888" value="0x43900000" />
+        <register type="NOA" address="0x00009888" value="0x55900000" />
+        <register type="NOA" address="0x00009888" value="0x47900000" />
+        <register type="NOA" address="0x00009888" value="0x57900000" />
+        <register type="NOA" address="0x00009888" value="0x49900000" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x30800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+        <register type="OA" address="0x00002770" value="0x00E00021" />
+        <register type="OA" address="0x00002774" value="0x0007FFF8" />
+        <register type="OA" address="0x00002778" value="0x07000101" />
+        <register type="OA" address="0x0000277C" value="0x0038FFC7" />
+    </register_config>
+  </set>
+
+</metrics>
diff --git a/lib/i915/perf-configs/oa-cflgt2.xml b/lib/i915/perf-configs/oa-cflgt2.xml
new file mode 100644
index 00000000..6a9a73df
--- /dev/null
+++ b/lib/i915/perf-configs/oa-cflgt2.xml
@@ -0,0 +1,10866 @@
+<?xml version="1.0"?>
+<metrics version="1581935520" merge_md5="">
+  <set name="Render Metrics Basic Gen9"
+       mdapi_supported_apis="VK OGL OCL IO BB"
+       underscore_name="render_basic"
+       hw_config_guid="7fa796a4-0c7a-4201-afc6-cff0b2f528a2"
+       chipset="CFLGT2"
+       symbol_name="RenderBasic"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Misses"
+             description="The total number of L3 misses."
+             data_type="uint64"
+             equation="C 4 READ"
+             underscore_name="l3_misses"
+             units="messages"
+             symbol_name="L3Misses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/TAG"
+             />
+    <counter name="GTI L3 Throughput"
+             description="The total number of GPU memory bytes transferred between L3 caches and GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="$L3Misses 64 UMUL"
+             underscore_name="gti_l3_throughput"
+             units="bytes"
+             symbol_name="GtiL3Throughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Cache Misses"
+             description="The total number of sampler cache misses in all LODs in all sampler units."
+             data_type="uint64"
+             equation="B 4 READ 8 UMUL"
+             underscore_name="sampler_l1_misses"
+             units="messages"
+             symbol_name="SamplerL1Misses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler 1 Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which Sampler 1 has been slowing down the pipe when processing EU requests."
+             data_type="float"
+             high_watermark="15"
+             equation="B 3 READ 100 UMUL $GpuCoreClocks FDIV"
+             max_equation="100"
+             underscore_name="sampler1_bottleneck"
+             units="percent"
+             symbol_name="Sampler1Bottleneck"
+             availability="$SubsliceMask 0x12 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="L3 Sampler Throughput"
+             description="The total number of GPU memory bytes transferred between samplers and L3 caches."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="$SamplerL1Misses 64 UMUL"
+             underscore_name="l3_sampler_throughput"
+             units="bytes"
+             symbol_name="L3SamplerThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Sampler"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on the both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Sampler 0 Busy"
+             description="The percentage of time in which Sampler 0 has been processing EU requests."
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler0_busy"
+             units="percent"
+             symbol_name="Sampler0Busy"
+             availability="$SubsliceMask 0x09 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_group="Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Sampler 1 Busy"
+             description="The percentage of time in which Sampler 1 has been processing EU requests."
+             data_type="float"
+             max_equation="100"
+             equation="B 1 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler1_busy"
+             units="percent"
+             symbol_name="Sampler1Busy"
+             availability="$SubsliceMask 0x12 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_group="Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Samplers Busy"
+             description="The percentage of time in which samplers have been processing EU requests."
+             data_type="float"
+             max_equation="100"
+             equation="$Sampler0Busy $Sampler1Busy FMAX"
+             underscore_name="samplers_busy"
+             units="percent"
+             symbol_name="SamplersBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="Sampler"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="GTI Fixed Pipe Throughput"
+             description="The total number of GPU memory bytes transferred between 3D Pipeline (Command Dispatch, Input Assembly and Stream Output) and GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL"
+             equation="B 6 READ B 7 READ UADD 64 UMUL"
+             underscore_name="gti_vf_throughput"
+             units="bytes"
+             symbol_name="GtiVfThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="GTI/3D Pipe"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler 0 Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which Sampler 0 has been slowing down the pipe when processing EU requests."
+             data_type="float"
+             high_watermark="15"
+             equation="B 2 READ 100 UMUL $GpuCoreClocks FDIV"
+             max_equation="100"
+             underscore_name="sampler0_bottleneck"
+             units="percent"
+             symbol_name="Sampler0Bottleneck"
+             availability="$SubsliceMask 0x09 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="L3 Lookup Accesses w/o IC"
+             description="The total number of L3 cache lookup accesses w/o IC."
+             data_type="uint64"
+             equation="$SamplerL1Misses $ShaderMemoryAccesses UADD"
+             underscore_name="l3_lookups"
+             units="messages"
+             symbol_name="L3Lookups"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/TAG"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GTI Read Throughput"
+             description="The total number of GPU memory bytes read from GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL"
+             equation="C 6 READ 64 UMUL"
+             underscore_name="gti_read_throughput"
+             units="bytes"
+             symbol_name="GtiReadThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GTI Depth Throughput"
+             description="The total number of GPU memory bytes transferred between depth caches and GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="C 0 READ C 1 READ UADD 64 UMUL"
+             underscore_name="gti_depth_throughput"
+             units="bytes"
+             symbol_name="GtiDepthThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="GTI/Depth Cache"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Samplers Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which samplers have been slowing down the pipe when processing EU requests."
+             data_type="float"
+             high_watermark="15"
+             equation="$Sampler0Bottleneck $Sampler1Bottleneck FMAX"
+             max_equation="100"
+             underscore_name="sampler_bottleneck"
+             units="percent"
+             symbol_name="SamplerBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Indicate System Frame Batch Draw"
+             mdapi_group="Sampler"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="GTI HDC TLB Lookup Throughput"
+             description="The total number of GPU memory bytes transferred between GTI and HDC, when HDC is doing TLB lookups."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="C 5 READ 64 UMUL"
+             underscore_name="gti_hdc_lookups_throughput"
+             units="bytes"
+             symbol_name="GtiHdcLookupsThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GTI RCC Throughput"
+             description="The total number of GPU memory bytes transferred between render color caches and GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="C 2 READ C 3 READ UADD 64 UMUL"
+             underscore_name="gti_rcc_throughput"
+             units="bytes"
+             symbol_name="GtiRccThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="GTI/Color Cache"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="GTI Write Throughput"
+             description="The total number of GPU memory bytes written to GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 32 UMUL"
+             equation="C 7 READ 64 UMUL"
+             underscore_name="gti_write_throughput"
+             units="bytes"
+             symbol_name="GtiWriteThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x166C01E0" />
+        <register type="NOA" address="0x00009888" value="0x12170280" />
+        <register type="NOA" address="0x00009888" value="0x12370280" />
+        <register type="NOA" address="0x00009888" value="0x11930317" />
+        <register type="NOA" address="0x00009888" value="0x159303DF" />
+        <register type="NOA" address="0x00009888" value="0x3F900003" />
+        <register type="NOA" address="0x00009888" value="0x1A4E0080" />
+        <register type="NOA" address="0x00009888" value="0x0A6C0053" />
+        <register type="NOA" address="0x00009888" value="0x106C0000" />
+        <register type="NOA" address="0x00009888" value="0x1C6C0000" />
+        <register type="NOA" address="0x00009888" value="0x0A1B4000" />
+        <register type="NOA" address="0x00009888" value="0x1C1C0001" />
+        <register type="NOA" address="0x00009888" value="0x002F1000" />
+        <register type="NOA" address="0x00009888" value="0x042F1000" />
+        <register type="NOA" address="0x00009888" value="0x004C4000" />
+        <register type="NOA" address="0x00009888" value="0x0A4C8400" />
+        <register type="NOA" address="0x00009888" value="0x000D2000" />
+        <register type="NOA" address="0x00009888" value="0x060D8000" />
+        <register type="NOA" address="0x00009888" value="0x080DA000" />
+        <register type="NOA" address="0x00009888" value="0x0A0D2000" />
+        <register type="NOA" address="0x00009888" value="0x0C0F0400" />
+        <register type="NOA" address="0x00009888" value="0x0E0F6600" />
+        <register type="NOA" address="0x00009888" value="0x002C8000" />
+        <register type="NOA" address="0x00009888" value="0x162C2200" />
+        <register type="NOA" address="0x00009888" value="0x062D8000" />
+        <register type="NOA" address="0x00009888" value="0x082D8000" />
+        <register type="NOA" address="0x00009888" value="0x00133000" />
+        <register type="NOA" address="0x00009888" value="0x08133000" />
+        <register type="NOA" address="0x00009888" value="0x00170020" />
+        <register type="NOA" address="0x00009888" value="0x08170021" />
+        <register type="NOA" address="0x00009888" value="0x10170000" />
+        <register type="NOA" address="0x00009888" value="0x0633C000" />
+        <register type="NOA" address="0x00009888" value="0x0833C000" />
+        <register type="NOA" address="0x00009888" value="0x06370800" />
+        <register type="NOA" address="0x00009888" value="0x08370840" />
+        <register type="NOA" address="0x00009888" value="0x10370000" />
+        <register type="NOA" address="0x00009888" value="0x0D933031" />
+        <register type="NOA" address="0x00009888" value="0x0F933E3F" />
+        <register type="NOA" address="0x00009888" value="0x01933D00" />
+        <register type="NOA" address="0x00009888" value="0x0393073C" />
+        <register type="NOA" address="0x00009888" value="0x0593000E" />
+        <register type="NOA" address="0x00009888" value="0x1D930000" />
+        <register type="NOA" address="0x00009888" value="0x19930000" />
+        <register type="NOA" address="0x00009888" value="0x1B930000" />
+        <register type="NOA" address="0x00009888" value="0x1D900157" />
+        <register type="NOA" address="0x00009888" value="0x1F900158" />
+        <register type="NOA" address="0x00009888" value="0x35900000" />
+        <register type="NOA" address="0x00009888" value="0x2B908000" />
+        <register type="NOA" address="0x00009888" value="0x2D908000" />
+        <register type="NOA" address="0x00009888" value="0x2F908000" />
+        <register type="NOA" address="0x00009888" value="0x31908000" />
+        <register type="NOA" address="0x00009888" value="0x15908000" />
+        <register type="NOA" address="0x00009888" value="0x17908000" />
+        <register type="NOA" address="0x00009888" value="0x19908000" />
+        <register type="NOA" address="0x00009888" value="0x1B908000" />
+        <register type="NOA" address="0x00009888" value="0x1190001F" />
+        <register type="NOA" address="0x00009888" value="0x51904400" />
+        <register type="NOA" address="0x00009888" value="0x41900020" />
+        <register type="NOA" address="0x00009888" value="0x55900000" />
+        <register type="NOA" address="0x00009888" value="0x45900C21" />
+        <register type="NOA" address="0x00009888" value="0x47900061" />
+        <register type="NOA" address="0x00009888" value="0x57904440" />
+        <register type="NOA" address="0x00009888" value="0x49900000" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+        <register type="NOA" address="0x00009888" value="0x4B900000" />
+        <register type="NOA" address="0x00009888" value="0x59900004" />
+        <register type="NOA" address="0x00009888" value="0x43900000" />
+        <register type="NOA" address="0x00009888" value="0x53904444" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x00800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+        <register type="OA" address="0x00002740" value="0x00000000" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E758" value="0x00015014" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+        <register type="FLEX" address="0x0000E65C" value="0x00222222" />
+    </register_config>
+  </set>
+
+  <set name="Compute Metrics Basic Gen9"
+       mdapi_supported_apis="VK OGL4 OCL IO BB"
+       underscore_name="compute_basic"
+       hw_config_guid="a4985100-5f76-4822-8ca7-67908cb26274"
+       chipset="CFLGT2"
+       symbol_name="ComputeBasic"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Untyped Bytes Read"
+             description="The total number of untyped memory bytes read via Data Port."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="B 6 READ B 7 READ C 0 READ UADD UADD $EuSlicesTotalCount 64 UMUL UMUL"
+             underscore_name="untyped_bytes_read"
+             units="bytes"
+             symbol_name="UntypedBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Typed Bytes Written"
+             description="The total number of typed memory bytes written via Data Port."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="B 3 READ B 4 READ B 5 READ UADD UADD $EuSlicesTotalCount 64 UMUL UMUL"
+             underscore_name="typed_bytes_written"
+             units="bytes"
+             symbol_name="TypedBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="fpu0_active"
+             units="percent"
+             symbol_name="Fpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="fpu1_active"
+             units="percent"
+             symbol_name="Fpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU AVG IPC Rate"
+             description="The average rate of IPC calculated for 2 FPU pipelines."
+             data_type="float"
+             max_equation="2"
+             equation="A 9 READ  A 10 READ  A 11 READ UADD  A 9 READ USUB FDIV 1 FADD"
+             underscore_name="eu_avg_ipc_rate"
+             units="number"
+             symbol_name="EuAvgIpcRate"
+             semantic_type="ratio"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier4 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texel lookups (with 2x2 accuracy) that missed the L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GTI Read Throughput"
+             description="The total number of GPU memory bytes read from GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="C 4 READ 64 UMUL"
+             underscore_name="gti_read_throughput"
+             units="bytes"
+             symbol_name="GtiReadThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Untyped Writes"
+             description="The total number of untyped memory bytes written via Data Port."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="C 1 READ C 2 READ C 3 READ UADD UADD $EuSlicesTotalCount 64 UMUL UMUL"
+             underscore_name="untyped_bytes_written"
+             units="bytes"
+             symbol_name="UntypedBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="Typed Bytes Read"
+             description="The total number of typed memory bytes read via Data Port."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="B 0 READ B 1 READ B 2 READ UADD UADD $EuSlicesTotalCount 64 UMUL UMUL"
+             underscore_name="typed_bytes_read"
+             units="bytes"
+             symbol_name="TypedBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="EU Thread Occupancy"
+             description="The percentage of time in which hardware threads occupied EUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 13 READ 8 UMUL $EuCoresTotalCount UDIV $EuThreadsCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_thread_occupancy"
+             units="percent"
+             symbol_name="EuThreadOccupancy"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="GTI Write Throughput"
+             description="The total number of GPU memory bytes written to GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 32 UMUL"
+             equation="C 5 READ 64 UMUL"
+             underscore_name="gti_write_throughput"
+             units="bytes"
+             symbol_name="GtiWriteThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <counter name="EU Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_send_active"
+             units="percent"
+             symbol_name="EuSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x104F00E0" />
+        <register type="NOA" address="0x00009888" value="0x124F1C00" />
+        <register type="NOA" address="0x00009888" value="0x106C00E0" />
+        <register type="NOA" address="0x00009888" value="0x37906800" />
+        <register type="NOA" address="0x00009888" value="0x3F900003" />
+        <register type="NOA" address="0x00009888" value="0x004E8000" />
+        <register type="NOA" address="0x00009888" value="0x1A4E0820" />
+        <register type="NOA" address="0x00009888" value="0x1C4E0002" />
+        <register type="NOA" address="0x00009888" value="0x064F0900" />
+        <register type="NOA" address="0x00009888" value="0x084F0032" />
+        <register type="NOA" address="0x00009888" value="0x0A4F1891" />
+        <register type="NOA" address="0x00009888" value="0x0C4F0E00" />
+        <register type="NOA" address="0x00009888" value="0x0E4F003C" />
+        <register type="NOA" address="0x00009888" value="0x004F0D80" />
+        <register type="NOA" address="0x00009888" value="0x024F003B" />
+        <register type="NOA" address="0x00009888" value="0x006C0002" />
+        <register type="NOA" address="0x00009888" value="0x086C0100" />
+        <register type="NOA" address="0x00009888" value="0x0C6C000C" />
+        <register type="NOA" address="0x00009888" value="0x0E6C0B00" />
+        <register type="NOA" address="0x00009888" value="0x186C0000" />
+        <register type="NOA" address="0x00009888" value="0x1C6C0000" />
+        <register type="NOA" address="0x00009888" value="0x1E6C0000" />
+        <register type="NOA" address="0x00009888" value="0x001B4000" />
+        <register type="NOA" address="0x00009888" value="0x081B8000" />
+        <register type="NOA" address="0x00009888" value="0x0C1B4000" />
+        <register type="NOA" address="0x00009888" value="0x0E1B8000" />
+        <register type="NOA" address="0x00009888" value="0x101C8000" />
+        <register type="NOA" address="0x00009888" value="0x1A1C8000" />
+        <register type="NOA" address="0x00009888" value="0x1C1C0024" />
+        <register type="NOA" address="0x00009888" value="0x065B8000" />
+        <register type="NOA" address="0x00009888" value="0x085B4000" />
+        <register type="NOA" address="0x00009888" value="0x0A5BC000" />
+        <register type="NOA" address="0x00009888" value="0x0C5B8000" />
+        <register type="NOA" address="0x00009888" value="0x0E5B4000" />
+        <register type="NOA" address="0x00009888" value="0x005B8000" />
+        <register type="NOA" address="0x00009888" value="0x025B4000" />
+        <register type="NOA" address="0x00009888" value="0x1A5C6000" />
+        <register type="NOA" address="0x00009888" value="0x1C5C001B" />
+        <register type="NOA" address="0x00009888" value="0x125C8000" />
+        <register type="NOA" address="0x00009888" value="0x145C8000" />
+        <register type="NOA" address="0x00009888" value="0x004C8000" />
+        <register type="NOA" address="0x00009888" value="0x0A4C2000" />
+        <register type="NOA" address="0x00009888" value="0x0C4C0208" />
+        <register type="NOA" address="0x00009888" value="0x000DA000" />
+        <register type="NOA" address="0x00009888" value="0x060D8000" />
+        <register type="NOA" address="0x00009888" value="0x080DA000" />
+        <register type="NOA" address="0x00009888" value="0x0A0DA000" />
+        <register type="NOA" address="0x00009888" value="0x0C0DA000" />
+        <register type="NOA" address="0x00009888" value="0x0E0DA000" />
+        <register type="NOA" address="0x00009888" value="0x020D2000" />
+        <register type="NOA" address="0x00009888" value="0x0C0F5400" />
+        <register type="NOA" address="0x00009888" value="0x0E0F5500" />
+        <register type="NOA" address="0x00009888" value="0x100F0155" />
+        <register type="NOA" address="0x00009888" value="0x002C8000" />
+        <register type="NOA" address="0x00009888" value="0x0E2CC000" />
+        <register type="NOA" address="0x00009888" value="0x162CFB00" />
+        <register type="NOA" address="0x00009888" value="0x182C00BE" />
+        <register type="NOA" address="0x00009888" value="0x022CC000" />
+        <register type="NOA" address="0x00009888" value="0x042CC000" />
+        <register type="NOA" address="0x00009888" value="0x19900157" />
+        <register type="NOA" address="0x00009888" value="0x1B900158" />
+        <register type="NOA" address="0x00009888" value="0x1D900105" />
+        <register type="NOA" address="0x00009888" value="0x1F900103" />
+        <register type="NOA" address="0x00009888" value="0x35900000" />
+        <register type="NOA" address="0x00009888" value="0x11900FFF" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x41900800" />
+        <register type="NOA" address="0x00009888" value="0x55900000" />
+        <register type="NOA" address="0x00009888" value="0x45900821" />
+        <register type="NOA" address="0x00009888" value="0x47900802" />
+        <register type="NOA" address="0x00009888" value="0x57900000" />
+        <register type="NOA" address="0x00009888" value="0x49900802" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+        <register type="NOA" address="0x00009888" value="0x4B900002" />
+        <register type="NOA" address="0x00009888" value="0x59900000" />
+        <register type="NOA" address="0x00009888" value="0x43900422" />
+        <register type="NOA" address="0x00009888" value="0x53904444" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x00800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+        <register type="OA" address="0x00002740" value="0x00000000" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00000003" />
+        <register type="FLEX" address="0x0000E658" value="0x00002001" />
+        <register type="FLEX" address="0x0000E758" value="0x00778008" />
+        <register type="FLEX" address="0x0000E45C" value="0x00088078" />
+        <register type="FLEX" address="0x0000E55C" value="0x00808708" />
+        <register type="FLEX" address="0x0000E65C" value="0x00222222" />
+    </register_config>
+  </set>
+
+  <set name="Render Metrics for 3D Pipeline Profile Gen9"
+       mdapi_supported_apis="VK OGL OCL IO BB"
+       underscore_name="render_pipe_profile"
+       hw_config_guid="2221e4d5-ed7b-445e-b2cc-3de1b97f4d42"
+       chipset="CFLGT2"
+       symbol_name="RenderPipeProfile"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Bottleneck"
+             low_watermark="10"
+             description="The percentage of time in which vertex shader pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="30"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_bottleneck"
+             units="percent"
+             symbol_name="VsBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Hi-Depth Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which early hierarchical depth test pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="15"
+             equation="C 6 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="hi_depth_bottleneck"
+             units="percent"
+             symbol_name="HiDepthBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which geometry shader pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="15"
+             equation="B 3 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gs_bottleneck"
+             units="percent"
+             symbol_name="GsBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Geometry Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="BC Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which barycentric coordinates calculation pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="15"
+             equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="bc_bottleneck"
+             units="percent"
+             symbol_name="BcBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Rasterizer/Barycentric Calc"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="HS Stall"
+             description="The percentage of time in which hull shader pipeline stage was stalled."
+             data_type="float"
+             equation="C 1 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="hs_stall"
+             units="percent"
+             symbol_name="HsStall"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier4 Correlate Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Hull Shader"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texel lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="VF Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which vertex fetch pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="15"
+             equation="C 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vf_bottleneck"
+             units="percent"
+             symbol_name="VfBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Input Assembler"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Strip-Fans Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which strip-fans pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="10"
+             equation="B 6 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sf_bottleneck"
+             units="percent"
+             symbol_name="SfBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Rasterizer/Strip-Fans"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SF Stall"
+             description="The percentage of time in which strip-fans pipeline stage was stalled."
+             data_type="float"
+             equation="C 5 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sf_stall"
+             units="percent"
+             symbol_name="SfStall"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Correlate Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Strip-Fans"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="HS Bottleneck"
+             low_watermark="3"
+             description="The percentage of time in which hull shader pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="9"
+             equation="B 1 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="hs_bottleneck"
+             units="percent"
+             symbol_name="HsBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Hull Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="CL Stall"
+             description="The percentage of time in which clipper pipeline stage was stalled."
+             data_type="float"
+             equation="C 4 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="cl_stall"
+             units="percent"
+             symbol_name="ClStall"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Correlate Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Clipper"
+             />
+    <counter name="SO Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which stream output pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="15"
+             equation="B 4 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="so_bottleneck"
+             units="percent"
+             symbol_name="SoBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Stream Output"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="DS Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which domain shader pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="15"
+             equation="B 2 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ds_bottleneck"
+             units="percent"
+             symbol_name="DsBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Domain Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Clipper Bottleneck"
+             low_watermark="10"
+             description="The percentage of time in which clipper pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="30"
+             equation="B 5 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="cl_bottleneck"
+             units="percent"
+             symbol_name="ClBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Clipper"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Stall"
+             description="The percentage of time in which domain shader pipeline stage was stalled."
+             data_type="float"
+             equation="C 2 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ds_stall"
+             units="percent"
+             symbol_name="DsStall"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier4 Correlate Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Domain Shader"
+             />
+    <counter name="Early Depth Bottleneck"
+             low_watermark="10"
+             description="The percentage of time in which early depth test pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="30"
+             equation="B 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="early_depth_bottleneck"
+             units="percent"
+             symbol_name="EarlyDepthBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="SO Stall"
+             description="The percentage of time in which stream-output pipeline stage was stalled."
+             data_type="float"
+             equation="C 3 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="so_stall"
+             units="percent"
+             symbol_name="SoStall"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Correlate Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Stream Output"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x0C0E001F" />
+        <register type="NOA" address="0x00009888" value="0x0A0F0000" />
+        <register type="NOA" address="0x00009888" value="0x10116800" />
+        <register type="NOA" address="0x00009888" value="0x178A03E0" />
+        <register type="NOA" address="0x00009888" value="0x11824C00" />
+        <register type="NOA" address="0x00009888" value="0x11830020" />
+        <register type="NOA" address="0x00009888" value="0x13840020" />
+        <register type="NOA" address="0x00009888" value="0x11850019" />
+        <register type="NOA" address="0x00009888" value="0x11860007" />
+        <register type="NOA" address="0x00009888" value="0x01870C40" />
+        <register type="NOA" address="0x00009888" value="0x17880000" />
+        <register type="NOA" address="0x00009888" value="0x022F4000" />
+        <register type="NOA" address="0x00009888" value="0x0A4C0040" />
+        <register type="NOA" address="0x00009888" value="0x0C0D8000" />
+        <register type="NOA" address="0x00009888" value="0x040D4000" />
+        <register type="NOA" address="0x00009888" value="0x060D2000" />
+        <register type="NOA" address="0x00009888" value="0x020E5400" />
+        <register type="NOA" address="0x00009888" value="0x000E0000" />
+        <register type="NOA" address="0x00009888" value="0x080F0040" />
+        <register type="NOA" address="0x00009888" value="0x000F0000" />
+        <register type="NOA" address="0x00009888" value="0x100F0000" />
+        <register type="NOA" address="0x00009888" value="0x0E0F0040" />
+        <register type="NOA" address="0x00009888" value="0x0C2C8000" />
+        <register type="NOA" address="0x00009888" value="0x06104000" />
+        <register type="NOA" address="0x00009888" value="0x06110012" />
+        <register type="NOA" address="0x00009888" value="0x06131000" />
+        <register type="NOA" address="0x00009888" value="0x01898000" />
+        <register type="NOA" address="0x00009888" value="0x0D890100" />
+        <register type="NOA" address="0x00009888" value="0x03898000" />
+        <register type="NOA" address="0x00009888" value="0x09808000" />
+        <register type="NOA" address="0x00009888" value="0x0B808000" />
+        <register type="NOA" address="0x00009888" value="0x0380C000" />
+        <register type="NOA" address="0x00009888" value="0x0F8A0075" />
+        <register type="NOA" address="0x00009888" value="0x1D8A0000" />
+        <register type="NOA" address="0x00009888" value="0x118A8000" />
+        <register type="NOA" address="0x00009888" value="0x1B8A4000" />
+        <register type="NOA" address="0x00009888" value="0x138A8000" />
+        <register type="NOA" address="0x00009888" value="0x1D81A000" />
+        <register type="NOA" address="0x00009888" value="0x15818000" />
+        <register type="NOA" address="0x00009888" value="0x17818000" />
+        <register type="NOA" address="0x00009888" value="0x0B820030" />
+        <register type="NOA" address="0x00009888" value="0x07828000" />
+        <register type="NOA" address="0x00009888" value="0x0D824000" />
+        <register type="NOA" address="0x00009888" value="0x0F828000" />
+        <register type="NOA" address="0x00009888" value="0x05824000" />
+        <register type="NOA" address="0x00009888" value="0x0D830003" />
+        <register type="NOA" address="0x00009888" value="0x0583000C" />
+        <register type="NOA" address="0x00009888" value="0x09830000" />
+        <register type="NOA" address="0x00009888" value="0x03838000" />
+        <register type="NOA" address="0x00009888" value="0x07838000" />
+        <register type="NOA" address="0x00009888" value="0x0B840980" />
+        <register type="NOA" address="0x00009888" value="0x03844D80" />
+        <register type="NOA" address="0x00009888" value="0x11840000" />
+        <register type="NOA" address="0x00009888" value="0x09848000" />
+        <register type="NOA" address="0x00009888" value="0x09850080" />
+        <register type="NOA" address="0x00009888" value="0x03850003" />
+        <register type="NOA" address="0x00009888" value="0x01850000" />
+        <register type="NOA" address="0x00009888" value="0x07860000" />
+        <register type="NOA" address="0x00009888" value="0x0F860400" />
+        <register type="NOA" address="0x00009888" value="0x09870032" />
+        <register type="NOA" address="0x00009888" value="0x01888052" />
+        <register type="NOA" address="0x00009888" value="0x11880000" />
+        <register type="NOA" address="0x00009888" value="0x09884000" />
+        <register type="NOA" address="0x00009888" value="0x1B931001" />
+        <register type="NOA" address="0x00009888" value="0x1D930001" />
+        <register type="NOA" address="0x00009888" value="0x19934000" />
+        <register type="NOA" address="0x00009888" value="0x1B958000" />
+        <register type="NOA" address="0x00009888" value="0x1D950094" />
+        <register type="NOA" address="0x00009888" value="0x19958000" />
+        <register type="NOA" address="0x00009888" value="0x09E58000" />
+        <register type="NOA" address="0x00009888" value="0x0BE58000" />
+        <register type="NOA" address="0x00009888" value="0x03E5C000" />
+        <register type="NOA" address="0x00009888" value="0x0592C000" />
+        <register type="NOA" address="0x00009888" value="0x0B928000" />
+        <register type="NOA" address="0x00009888" value="0x0D924000" />
+        <register type="NOA" address="0x00009888" value="0x0F924000" />
+        <register type="NOA" address="0x00009888" value="0x11928000" />
+        <register type="NOA" address="0x00009888" value="0x1392C000" />
+        <register type="NOA" address="0x00009888" value="0x09924000" />
+        <register type="NOA" address="0x00009888" value="0x01985000" />
+        <register type="NOA" address="0x00009888" value="0x07988000" />
+        <register type="NOA" address="0x00009888" value="0x09981000" />
+        <register type="NOA" address="0x00009888" value="0x0B982000" />
+        <register type="NOA" address="0x00009888" value="0x0D982000" />
+        <register type="NOA" address="0x00009888" value="0x0F989000" />
+        <register type="NOA" address="0x00009888" value="0x05982000" />
+        <register type="NOA" address="0x00009888" value="0x13904000" />
+        <register type="NOA" address="0x00009888" value="0x21904000" />
+        <register type="NOA" address="0x00009888" value="0x23904000" />
+        <register type="NOA" address="0x00009888" value="0x25908000" />
+        <register type="NOA" address="0x00009888" value="0x27904000" />
+        <register type="NOA" address="0x00009888" value="0x29908000" />
+        <register type="NOA" address="0x00009888" value="0x2B904000" />
+        <register type="NOA" address="0x00009888" value="0x2F904000" />
+        <register type="NOA" address="0x00009888" value="0x31904000" />
+        <register type="NOA" address="0x00009888" value="0x15904000" />
+        <register type="NOA" address="0x00009888" value="0x17908000" />
+        <register type="NOA" address="0x00009888" value="0x19908000" />
+        <register type="NOA" address="0x00009888" value="0x1B904000" />
+        <register type="NOA" address="0x00009888" value="0x1190C080" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x41900440" />
+        <register type="NOA" address="0x00009888" value="0x55900000" />
+        <register type="NOA" address="0x00009888" value="0x45900400" />
+        <register type="NOA" address="0x00009888" value="0x47900C21" />
+        <register type="NOA" address="0x00009888" value="0x57900400" />
+        <register type="NOA" address="0x00009888" value="0x49900042" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+        <register type="NOA" address="0x00009888" value="0x4B900024" />
+        <register type="NOA" address="0x00009888" value="0x59900000" />
+        <register type="NOA" address="0x00009888" value="0x43900841" />
+        <register type="NOA" address="0x00009888" value="0x53900400" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002724" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002770" value="0x0007FFEA" />
+        <register type="OA" address="0x00002774" value="0x00007FFC" />
+        <register type="OA" address="0x00002778" value="0x0007AFFA" />
+        <register type="OA" address="0x0000277C" value="0x0000F5FD" />
+        <register type="OA" address="0x00002780" value="0x00079FFA" />
+        <register type="OA" address="0x00002784" value="0x0000F3FB" />
+        <register type="OA" address="0x00002788" value="0x0007BF7A" />
+        <register type="OA" address="0x0000278C" value="0x0000F7E7" />
+        <register type="OA" address="0x00002790" value="0x0007FEFA" />
+        <register type="OA" address="0x00002794" value="0x0000F7CF" />
+        <register type="OA" address="0x00002798" value="0x00077FFA" />
+        <register type="OA" address="0x0000279C" value="0x0000EFDF" />
+        <register type="OA" address="0x000027A0" value="0x0006FFFA" />
+        <register type="OA" address="0x000027A4" value="0x0000CFBF" />
+        <register type="OA" address="0x000027A8" value="0x0003FFFA" />
+        <register type="OA" address="0x000027AC" value="0x00005F7F" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00015014" />
+        <register type="FLEX" address="0x0000E658" value="0x00025024" />
+        <register type="FLEX" address="0x0000E758" value="0x00035034" />
+        <register type="FLEX" address="0x0000E45C" value="0x00045044" />
+        <register type="FLEX" address="0x0000E55C" value="0x00055054" />
+        <register type="FLEX" address="0x0000E65C" value="0x00065064" />
+    </register_config>
+  </set>
+
+  <set name="Memory Reads Distribution Gen9"
+       mdapi_supported_apis="VK OGL OCL IO BB"
+       underscore_name="memory_reads"
+       hw_config_guid="82096a90-e2fa-4f38-ac14-562b2496933a"
+       chipset="CFLGT2"
+       symbol_name="MemoryReads"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GtiL3Bank0Reads"
+             description="The total number of GTI memory reads from L3 Bank 0 (L3 Cache misses)."
+             data_type="uint64"
+             equation="C 4 READ"
+             underscore_name="gti_l3_bank0_reads"
+             units="messages"
+             symbol_name="GtiL3Bank0Reads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/L3"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="GtiRingAccesses"
+             description="The total number of all accesses from GTI to the ring."
+             data_type="uint64"
+             equation="C 3 READ 2 UMUL"
+             underscore_name="gti_ring_accesses"
+             units="messages"
+             symbol_name="GtiRingAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="GtiL3Bank3Reads"
+             description="The total number of GTI memory reads from L3 Bank 3 (L3 Cache misses)."
+             data_type="uint64"
+             equation="C 7 READ"
+             underscore_name="gti_l3_bank3_reads"
+             units="messages"
+             symbol_name="GtiL3Bank3Reads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="GTI/L3"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="GtiRsMemoryReads"
+             description="The total number of GTI memory reads from Resource Streamer."
+             data_type="uint64"
+             equation="B 2 READ"
+             underscore_name="gti_rs_memory_reads"
+             units="messages"
+             symbol_name="GtiRsMemoryReads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/3D Pipe/Resource Streamer"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GtiHizMemoryReads"
+             description="The total number of GTI memory reads from Hierarchical Depth Cache (Hi-Depth Cache misses)."
+             data_type="uint64"
+             equation="B 5 READ"
+             underscore_name="gti_hiz_memory_reads"
+             units="messages"
+             symbol_name="GtiHizMemoryReads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Depth Cache"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="GtiRccMemoryReads"
+             description="The total number of GTI memory reads from Render Color Cache (Render Color Cache misses)."
+             data_type="uint64"
+             equation="B 3 READ"
+             underscore_name="gti_rcc_memory_reads"
+             units="messages"
+             symbol_name="GtiRccMemoryReads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Color Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GtiL3Bank1Reads"
+             description="The total number of GTI memory reads from L3 Bank 1 (L3 Cache misses)."
+             data_type="uint64"
+             equation="C 5 READ"
+             underscore_name="gti_l3_bank1_reads"
+             units="messages"
+             symbol_name="GtiL3Bank1Reads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="GTI/L3"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GtiCmdStreamerMemoryReads"
+             description="The total number of GTI memory reads from Command Streamer."
+             data_type="uint64"
+             equation="B 0 READ"
+             underscore_name="gti_cmd_streamer_memory_reads"
+             units="messages"
+             symbol_name="GtiCmdStreamerMemoryReads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/3D Pipe/Command Streamer"
+             />
+    <counter name="GtiL3Bank2Reads"
+             description="The total number of GTI memory reads from L3 Bank 2 (L3 Cache misses)."
+             data_type="uint64"
+             equation="C 6 READ"
+             underscore_name="gti_l3_bank2_reads"
+             units="messages"
+             symbol_name="GtiL3Bank2Reads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="GTI/L3"
+             />
+    <counter name="GtiMemoryReads"
+             description="The total number of GTI memory reads."
+             data_type="uint64"
+             equation="C 0 READ"
+             underscore_name="gti_memory_reads"
+             units="messages"
+             symbol_name="GtiMemoryReads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="GtiRczMemoryReads"
+             description="The total number of GTI memory reads from Render Depth Cache (Render Depth Cache misses)."
+             data_type="uint64"
+             equation="B 7 READ"
+             underscore_name="gti_rcz_memory_reads"
+             units="messages"
+             symbol_name="GtiRczMemoryReads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Depth Cache"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="GtiMscMemoryReads"
+             description="The total number of GTI memory reads from Multisampling Color Cache (Multisampling Color Cache misses)."
+             data_type="uint64"
+             equation="B 4 READ"
+             underscore_name="gti_msc_memory_reads"
+             units="messages"
+             symbol_name="GtiMscMemoryReads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Color Cache"
+             />
+    <counter name="GtiVfMemoryReads"
+             description="The total number of GTI memory reads from Vertex Fetch."
+             data_type="uint64"
+             equation="B 1 READ"
+             underscore_name="gti_vf_memory_reads"
+             units="messages"
+             symbol_name="GtiVfMemoryReads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/3D Pipe/Vertex Fetch"
+             />
+    <counter name="GtiStcMemoryReads"
+             description="The total number of GTI memory reads from Stencil Cache (Stencil Cache misses)."
+             data_type="uint64"
+             equation="B 6 READ"
+             underscore_name="gti_stc_memory_reads"
+             units="messages"
+             symbol_name="GtiStcMemoryReads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Depth Cache"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GtiL3Reads"
+             description="The total number of GTI memory reads from L3 (L3 Cache misses)."
+             data_type="uint64"
+             equation="$GtiL3Bank0Reads $GtiL3Bank1Reads $GtiL3Bank2Reads $GtiL3Bank3Reads UADD UADD UADD"
+             underscore_name="gti_l3_reads"
+             units="messages"
+             symbol_name="GtiL3Reads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/L3"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x11810C00" />
+        <register type="NOA" address="0x00009888" value="0x1381001A" />
+        <register type="NOA" address="0x00009888" value="0x37906800" />
+        <register type="NOA" address="0x00009888" value="0x3F900064" />
+        <register type="NOA" address="0x00009888" value="0x03811300" />
+        <register type="NOA" address="0x00009888" value="0x05811B12" />
+        <register type="NOA" address="0x00009888" value="0x0781001A" />
+        <register type="NOA" address="0x00009888" value="0x1F810000" />
+        <register type="NOA" address="0x00009888" value="0x17810000" />
+        <register type="NOA" address="0x00009888" value="0x19810000" />
+        <register type="NOA" address="0x00009888" value="0x1B810000" />
+        <register type="NOA" address="0x00009888" value="0x1D810000" />
+        <register type="NOA" address="0x00009888" value="0x1B930055" />
+        <register type="NOA" address="0x00009888" value="0x03E58000" />
+        <register type="NOA" address="0x00009888" value="0x05E5C000" />
+        <register type="NOA" address="0x00009888" value="0x07E54000" />
+        <register type="NOA" address="0x00009888" value="0x13900150" />
+        <register type="NOA" address="0x00009888" value="0x21900151" />
+        <register type="NOA" address="0x00009888" value="0x23900152" />
+        <register type="NOA" address="0x00009888" value="0x25900153" />
+        <register type="NOA" address="0x00009888" value="0x27900154" />
+        <register type="NOA" address="0x00009888" value="0x29900155" />
+        <register type="NOA" address="0x00009888" value="0x2B900156" />
+        <register type="NOA" address="0x00009888" value="0x2D900157" />
+        <register type="NOA" address="0x00009888" value="0x2F90015F" />
+        <register type="NOA" address="0x00009888" value="0x31900105" />
+        <register type="NOA" address="0x00009888" value="0x15900103" />
+        <register type="NOA" address="0x00009888" value="0x17900101" />
+        <register type="NOA" address="0x00009888" value="0x35900000" />
+        <register type="NOA" address="0x00009888" value="0x19908000" />
+        <register type="NOA" address="0x00009888" value="0x1B908000" />
+        <register type="NOA" address="0x00009888" value="0x1D908000" />
+        <register type="NOA" address="0x00009888" value="0x1F908000" />
+        <register type="NOA" address="0x00009888" value="0x11900000" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x41900C60" />
+        <register type="NOA" address="0x00009888" value="0x55900000" />
+        <register type="NOA" address="0x00009888" value="0x45900C00" />
+        <register type="NOA" address="0x00009888" value="0x47900C63" />
+        <register type="NOA" address="0x00009888" value="0x57900000" />
+        <register type="NOA" address="0x00009888" value="0x49900C63" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+        <register type="NOA" address="0x00009888" value="0x4B900063" />
+        <register type="NOA" address="0x00009888" value="0x59900000" />
+        <register type="NOA" address="0x00009888" value="0x43900003" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x0000272C" value="0xFFFFFFFF" />
+        <register type="OA" address="0x00002728" value="0xFFFFFFFF" />
+        <register type="OA" address="0x00002724" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x0000271C" value="0xFFFFFFFF" />
+        <register type="OA" address="0x00002718" value="0xFFFFFFFF" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x0000274C" value="0x86543210" />
+        <register type="OA" address="0x00002748" value="0x86543210" />
+        <register type="OA" address="0x00002744" value="0x00006667" />
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x0000275C" value="0x86543210" />
+        <register type="OA" address="0x00002758" value="0x86543210" />
+        <register type="OA" address="0x00002754" value="0x00006465" />
+        <register type="OA" address="0x00002750" value="0x00000000" />
+        <register type="OA" address="0x00002770" value="0x0007F81A" />
+        <register type="OA" address="0x00002774" value="0x0000FE00" />
+        <register type="OA" address="0x00002778" value="0x0007F82A" />
+        <register type="OA" address="0x0000277C" value="0x0000FE00" />
+        <register type="OA" address="0x00002780" value="0x0007F872" />
+        <register type="OA" address="0x00002784" value="0x0000FE00" />
+        <register type="OA" address="0x00002788" value="0x0007F8BA" />
+        <register type="OA" address="0x0000278C" value="0x0000FE00" />
+        <register type="OA" address="0x00002790" value="0x0007F87A" />
+        <register type="OA" address="0x00002794" value="0x0000FE00" />
+        <register type="OA" address="0x00002798" value="0x0007F8EA" />
+        <register type="OA" address="0x0000279C" value="0x0000FE00" />
+        <register type="OA" address="0x000027A0" value="0x0007F8E2" />
+        <register type="OA" address="0x000027A4" value="0x0000FE00" />
+        <register type="OA" address="0x000027A8" value="0x0007F8F2" />
+        <register type="OA" address="0x000027AC" value="0x0000FE00" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00015014" />
+        <register type="FLEX" address="0x0000E658" value="0x00025024" />
+        <register type="FLEX" address="0x0000E758" value="0x00035034" />
+        <register type="FLEX" address="0x0000E45C" value="0x00045044" />
+        <register type="FLEX" address="0x0000E55C" value="0x00055054" />
+        <register type="FLEX" address="0x0000E65C" value="0x00065064" />
+    </register_config>
+  </set>
+
+  <set name="Memory Writes Distribution Gen9"
+       mdapi_supported_apis="VK OGL OCL IO BB"
+       underscore_name="memory_writes"
+       hw_config_guid="9f638880-02e9-4a8d-896a-7670a3bf0d35"
+       chipset="CFLGT2"
+       symbol_name="MemoryWrites"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GtiMemoryWrites"
+             description="The total number of GTI memory writes."
+             data_type="uint64"
+             equation="C 0 READ"
+             underscore_name="gti_memory_writes"
+             units="messages"
+             symbol_name="GtiMemoryWrites"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="GtiRingAccesses"
+             description="The total number of all GTI accesses to the ring."
+             data_type="uint64"
+             equation="C 3 READ 2 UMUL"
+             underscore_name="gti_ring_accesses"
+             units="messages"
+             symbol_name="GtiRingAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="GtiMscMemoryWrites"
+             description="The total number of GTI memory writes from Multisampling Color Cache (Multisampling Color Cache invalidations)."
+             data_type="uint64"
+             equation="B 4 READ"
+             underscore_name="gti_msc_memory_writes"
+             units="messages"
+             symbol_name="GtiMscMemoryWrites"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Color Cache"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="GtiCmdStreamerMemoryWrites"
+             description="The total number of GTI memory writes from Command Streamer."
+             data_type="uint64"
+             equation="B 0 READ"
+             underscore_name="gti_cmd_streamer_memory_writes"
+             units="messages"
+             symbol_name="GtiCmdStreamerMemoryWrites"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/3D Pipe/Command Streamer"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GtiL3Bank0Writes"
+             description="The total number of GTI memory writes from L3 Bank 0 (L3 Bank 0 invalidations)."
+             data_type="uint64"
+             equation="C 4 READ"
+             underscore_name="gti_l3_bank0_writes"
+             units="messages"
+             symbol_name="GtiL3Bank0Writes"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/L3"
+             />
+    <counter name="GtiL3Bank1Writes"
+             description="The total number of GTI memory writes from L3 Bank 1 (L3 Bank 1 invalidations)."
+             data_type="uint64"
+             equation="C 5 READ"
+             underscore_name="gti_l3_bank1_writes"
+             units="messages"
+             symbol_name="GtiL3Bank1Writes"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/L3"
+             />
+    <counter name="GtiL3Bank2Writes"
+             description="The total number of GTI memory writes from L3 Bank 2 (L3 Bank 2 invalidations)."
+             data_type="uint64"
+             equation="C 6 READ"
+             underscore_name="gti_l3_bank2_writes"
+             units="messages"
+             symbol_name="GtiL3Bank2Writes"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/L3"
+             />
+    <counter name="GtiL3Bank3Writes"
+             description="The total number of GTI memory writes from L3 Bank 3 (L3 Bank 3 invalidations)."
+             data_type="uint64"
+             equation="C 7 READ"
+             underscore_name="gti_l3_bank3_writes"
+             units="messages"
+             symbol_name="GtiL3Bank3Writes"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/L3"
+             />
+    <counter name="GtiL3Writes"
+             description="The total number of GTI memory writes from L3 (L3 invalidations)."
+             data_type="uint64"
+             equation="$GtiL3Bank0Writes $GtiL3Bank1Writes $GtiL3Bank2Writes $GtiL3Bank3Writes UADD UADD UADD"
+             underscore_name="gti_l3_writes"
+             units="messages"
+             symbol_name="GtiL3Writes"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/L3"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GtiRccMemoryWrites"
+             description="The total number of GTI memory writes from Render Color Cache (Render Color Cache invalidations)."
+             data_type="uint64"
+             equation="B 3 READ"
+             underscore_name="gti_rcc_memory_writes"
+             units="messages"
+             symbol_name="GtiRccMemoryWrites"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Color Cache"
+             />
+    <counter name="GtiSoMemoryWrites"
+             description="The total number of GTI memory writes from Stream Output."
+             data_type="uint64"
+             equation="B 2 READ"
+             underscore_name="gti_so_memory_writes"
+             units="messages"
+             symbol_name="GtiSoMemoryWrites"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/3D Pipe/Stream Output"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GtiStcMemoryWrites"
+             description="The total number of GTI memory writes from Stencil Cache."
+             data_type="uint64"
+             equation="B 6 READ"
+             underscore_name="gti_stc_memory_writes"
+             units="messages"
+             symbol_name="GtiStcMemoryWrites"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Depth Cache"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="GtiRczMemoryWrites"
+             description="The total number of GTI memory writes from Render Depth Cache."
+             data_type="uint64"
+             equation="B 7 READ"
+             underscore_name="gti_rcz_memory_writes"
+             units="messages"
+             symbol_name="GtiRczMemoryWrites"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Depth Cache"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches without URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="GtiHizMemoryWrites"
+             description="The total number of GTI memory writes from Hierarchical Depth Cache."
+             data_type="uint64"
+             equation="B 5 READ"
+             underscore_name="gti_hiz_memory_writes"
+             units="messages"
+             symbol_name="GtiHizMemoryWrites"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Depth Cache"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x11810C00" />
+        <register type="NOA" address="0x00009888" value="0x1381001A" />
+        <register type="NOA" address="0x00009888" value="0x37906800" />
+        <register type="NOA" address="0x00009888" value="0x3F901000" />
+        <register type="NOA" address="0x00009888" value="0x03811300" />
+        <register type="NOA" address="0x00009888" value="0x05811B12" />
+        <register type="NOA" address="0x00009888" value="0x0781001A" />
+        <register type="NOA" address="0x00009888" value="0x1F810000" />
+        <register type="NOA" address="0x00009888" value="0x17810000" />
+        <register type="NOA" address="0x00009888" value="0x19810000" />
+        <register type="NOA" address="0x00009888" value="0x1B810000" />
+        <register type="NOA" address="0x00009888" value="0x1D810000" />
+        <register type="NOA" address="0x00009888" value="0x1B930055" />
+        <register type="NOA" address="0x00009888" value="0x03E58000" />
+        <register type="NOA" address="0x00009888" value="0x05E5C000" />
+        <register type="NOA" address="0x00009888" value="0x07E54000" />
+        <register type="NOA" address="0x00009888" value="0x13900160" />
+        <register type="NOA" address="0x00009888" value="0x21900161" />
+        <register type="NOA" address="0x00009888" value="0x23900162" />
+        <register type="NOA" address="0x00009888" value="0x25900163" />
+        <register type="NOA" address="0x00009888" value="0x27900164" />
+        <register type="NOA" address="0x00009888" value="0x29900165" />
+        <register type="NOA" address="0x00009888" value="0x2B900166" />
+        <register type="NOA" address="0x00009888" value="0x2D900167" />
+        <register type="NOA" address="0x00009888" value="0x2F900150" />
+        <register type="NOA" address="0x00009888" value="0x31900105" />
+        <register type="NOA" address="0x00009888" value="0x15900103" />
+        <register type="NOA" address="0x00009888" value="0x17900101" />
+        <register type="NOA" address="0x00009888" value="0x35900000" />
+        <register type="NOA" address="0x00009888" value="0x19908000" />
+        <register type="NOA" address="0x00009888" value="0x1B908000" />
+        <register type="NOA" address="0x00009888" value="0x1D908000" />
+        <register type="NOA" address="0x00009888" value="0x1F908000" />
+        <register type="NOA" address="0x00009888" value="0x11900000" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x41900C60" />
+        <register type="NOA" address="0x00009888" value="0x55900000" />
+        <register type="NOA" address="0x00009888" value="0x45900C00" />
+        <register type="NOA" address="0x00009888" value="0x47900C63" />
+        <register type="NOA" address="0x00009888" value="0x57900000" />
+        <register type="NOA" address="0x00009888" value="0x49900C63" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+        <register type="NOA" address="0x00009888" value="0x4B900063" />
+        <register type="NOA" address="0x00009888" value="0x59900000" />
+        <register type="NOA" address="0x00009888" value="0x43900003" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x0000272C" value="0xFFFFFFFF" />
+        <register type="OA" address="0x00002728" value="0xFFFFFFFF" />
+        <register type="OA" address="0x00002724" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x0000271C" value="0xFFFFFFFF" />
+        <register type="OA" address="0x00002718" value="0xFFFFFFFF" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x0000274C" value="0x86543210" />
+        <register type="OA" address="0x00002748" value="0x86543210" />
+        <register type="OA" address="0x00002744" value="0x00006667" />
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x0000275C" value="0x86543210" />
+        <register type="OA" address="0x00002758" value="0x86543210" />
+        <register type="OA" address="0x00002754" value="0x00006465" />
+        <register type="OA" address="0x00002750" value="0x00000000" />
+        <register type="OA" address="0x00002770" value="0x0007F81A" />
+        <register type="OA" address="0x00002774" value="0x0000FE00" />
+        <register type="OA" address="0x00002778" value="0x0007F82A" />
+        <register type="OA" address="0x0000277C" value="0x0000FE00" />
+        <register type="OA" address="0x00002780" value="0x0007F822" />
+        <register type="OA" address="0x00002784" value="0x0000FE00" />
+        <register type="OA" address="0x00002788" value="0x0007F8BA" />
+        <register type="OA" address="0x0000278C" value="0x0000FE00" />
+        <register type="OA" address="0x00002790" value="0x0007F87A" />
+        <register type="OA" address="0x00002794" value="0x0000FE00" />
+        <register type="OA" address="0x00002798" value="0x0007F8EA" />
+        <register type="OA" address="0x0000279C" value="0x0000FE00" />
+        <register type="OA" address="0x000027A0" value="0x0007F8E2" />
+        <register type="OA" address="0x000027A4" value="0x0000FE00" />
+        <register type="OA" address="0x000027A8" value="0x0007F8F2" />
+        <register type="OA" address="0x000027AC" value="0x0000FE00" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00015014" />
+        <register type="FLEX" address="0x0000E658" value="0x00025024" />
+        <register type="FLEX" address="0x0000E758" value="0x00035034" />
+        <register type="FLEX" address="0x0000E45C" value="0x00045044" />
+        <register type="FLEX" address="0x0000E55C" value="0x00055054" />
+        <register type="FLEX" address="0x0000E65C" value="0x00065064" />
+    </register_config>
+  </set>
+
+  <set name="Compute Metrics Extended Gen9"
+       mdapi_supported_apis="VK OGL4 OCL IO BB"
+       underscore_name="compute_extended"
+       hw_config_guid="8d4ad934-7c16-43d5-845a-51067a4c8e2f"
+       chipset="CFLGT2"
+       symbol_name="ComputeExtended"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="fpu0_active"
+             units="percent"
+             symbol_name="Fpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="fpu1_active"
+             units="percent"
+             symbol_name="Fpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU AVG IPC Rate"
+             description="The average rate of IPC calculated for 2 FPU pipelines."
+             data_type="float"
+             max_equation="2"
+             equation="A 9 READ  A 10 READ  A 11 READ UADD  A 9 READ USUB FDIV 1 FADD"
+             underscore_name="eu_avg_ipc_rate"
+             units="number"
+             symbol_name="EuAvgIpcRate"
+             semantic_type="ratio"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Typed Writes 0"
+             description="The subslice 0 typed writes."
+             data_type="uint64"
+             equation="C 0 READ"
+             underscore_name="typed_writes0"
+             units="messages"
+             symbol_name="TypedWrites0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="EuTypedAtomics0"
+             description="The subslice 0 EU Typed Atomics."
+             data_type="uint64"
+             equation="B 5 READ"
+             underscore_name="eu_typed_atomics0"
+             units="messages"
+             symbol_name="EuTypedAtomics0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="Typed Atomics 0"
+             description="The subslice 0 typed atomics."
+             data_type="uint64"
+             equation="C 4 READ"
+             underscore_name="typed_atomics0"
+             units="messages"
+             symbol_name="TypedAtomics0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="TypedAtomicsPerCacheLine"
+             description="The ratio of EU typed atomics requests to L3 cache line writes."
+             data_type="float"
+             equation="$EuTypedAtomics0 $TypedAtomics0 FDIV"
+             underscore_name="typed_atomics_per_cache_line"
+             units="eu sends to l3 cache lines"
+             symbol_name="TypedAtomicsPerCacheLine"
+             semantic_type="ratio"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="EuUntypedReads0"
+             description="The subslice 0 EU Untyped Reads."
+             data_type="uint64"
+             equation="B 0 READ"
+             underscore_name="eu_untyped_reads0"
+             units="messages"
+             symbol_name="EuUntypedReads0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="Untyped Writes 0"
+             description="The subslice 0 untyped writes (including SLM writes)."
+             data_type="uint64"
+             equation="C 1 READ"
+             underscore_name="untyped_writes0"
+             units="messages"
+             symbol_name="UntypedWrites0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="EuUntypedAtomics0"
+             description="The subslice 0 EU Untyped Atomics."
+             data_type="uint64"
+             equation="B 4 READ"
+             underscore_name="eu_untyped_atomics0"
+             units="messages"
+             symbol_name="EuUntypedAtomics0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="EuUntypedWrites0"
+             description="The subslice 0 EU Untyped Writes."
+             data_type="uint64"
+             equation="B 1 READ"
+             underscore_name="eu_untyped_writes0"
+             units="messages"
+             symbol_name="EuUntypedWrites0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="EuA64UntypedWrites0"
+             description="The subslice 0 EU A64 Untyped Writes."
+             data_type="uint64"
+             equation="B 7 READ"
+             underscore_name="eu_a64_untyped_writes0"
+             units="messages"
+             symbol_name="EuA64UntypedWrites0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="UntypedWritesPerCacheLine"
+             description="The ratio of EU untyped write requests to L3 cache line writes."
+             data_type="float"
+             equation="$EuUntypedWrites0 $EuA64UntypedWrites0 UADD $UntypedWrites0 FDIV"
+             underscore_name="untyped_writes_per_cache_line"
+             units="eu sends to l3 cache lines"
+             symbol_name="UntypedWritesPerCacheLine"
+             semantic_type="ratio"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texel lookups (with 2x2 accuracy) that missed the L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EuTypedWrites0"
+             description="The subslice 0 EU Typed Writes."
+             data_type="uint64"
+             equation="B 3 READ"
+             underscore_name="eu_typed_writes0"
+             units="messages"
+             symbol_name="EuTypedWrites0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="TypedWritesPerCacheLine"
+             description="The ratio of EU typed write requests to L3 cache line writes."
+             data_type="float"
+             equation="$EuTypedWrites0 $TypedWrites0 FDIV"
+             underscore_name="typed_writes_per_cache_line"
+             units="eu sends to l3 cache lines"
+             symbol_name="TypedWritesPerCacheLine"
+             semantic_type="ratio"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="Typed Reads 0"
+             description="The subslice 0 typed reads."
+             data_type="uint64"
+             equation="C 2 READ"
+             underscore_name="typed_reads0"
+             units="messages"
+             symbol_name="TypedReads0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="Untyped Reads 0"
+             description="The subslice 0 untyped reads (including SLM reads)."
+             data_type="uint64"
+             equation="C 3 READ"
+             underscore_name="untyped_reads0"
+             units="messages"
+             symbol_name="UntypedReads0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="EuA64UntypedReads0"
+             description="The subslice 0 EU A64 Untyped Reads."
+             data_type="uint64"
+             equation="B 6 READ"
+             underscore_name="eu_a64_untyped_reads0"
+             units="messages"
+             symbol_name="EuA64UntypedReads0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="EU Thread Occupancy"
+             description="The percentage of time in which hardware threads occupied EUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 13 READ 8 UMUL $EuCoresTotalCount UDIV $EuThreadsCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_thread_occupancy"
+             units="percent"
+             symbol_name="EuThreadOccupancy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EuTypedReads0"
+             description="The subslice 0 EU typed reads."
+             data_type="uint64"
+             equation="B 2 READ"
+             underscore_name="eu_typed_reads0"
+             units="messages"
+             symbol_name="EuTypedReads0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="UntypedReadsPerCacheLine"
+             description="The ratio of EU untyped read requests to L3 cache line reads."
+             data_type="float"
+             equation="$EuUntypedReads0 $EuA64UntypedReads0 UADD $UntypedReads0 FDIV"
+             underscore_name="untyped_reads_per_cache_line"
+             units="eu sends to l3 cache lines"
+             symbol_name="UntypedReadsPerCacheLine"
+             semantic_type="ratio"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="TypedReadsPerCacheLine"
+             description="The ratio of EU typed read requests to L3 cache line reads."
+             data_type="float"
+             equation="$EuTypedReads0 $TypedReads0 FDIV"
+             underscore_name="typed_reads_per_cache_line"
+             units="eu sends to l3 cache lines"
+             symbol_name="TypedReadsPerCacheLine"
+             semantic_type="ratio"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <counter name="EU Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_send_active"
+             units="percent"
+             symbol_name="EuSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x106C00E0" />
+        <register type="NOA" address="0x00009888" value="0x141C8160" />
+        <register type="NOA" address="0x00009888" value="0x161C8015" />
+        <register type="NOA" address="0x00009888" value="0x181C0120" />
+        <register type="NOA" address="0x00009888" value="0x004E8000" />
+        <register type="NOA" address="0x00009888" value="0x0E4E8000" />
+        <register type="NOA" address="0x00009888" value="0x184E8000" />
+        <register type="NOA" address="0x00009888" value="0x1A4EAAA0" />
+        <register type="NOA" address="0x00009888" value="0x1C4E0002" />
+        <register type="NOA" address="0x00009888" value="0x024E8000" />
+        <register type="NOA" address="0x00009888" value="0x044E8000" />
+        <register type="NOA" address="0x00009888" value="0x064E8000" />
+        <register type="NOA" address="0x00009888" value="0x084E8000" />
+        <register type="NOA" address="0x00009888" value="0x0A4E8000" />
+        <register type="NOA" address="0x00009888" value="0x0E6C0B01" />
+        <register type="NOA" address="0x00009888" value="0x006C0200" />
+        <register type="NOA" address="0x00009888" value="0x026C000C" />
+        <register type="NOA" address="0x00009888" value="0x1C6C0000" />
+        <register type="NOA" address="0x00009888" value="0x1E6C0000" />
+        <register type="NOA" address="0x00009888" value="0x1A6C0000" />
+        <register type="NOA" address="0x00009888" value="0x0E1BC000" />
+        <register type="NOA" address="0x00009888" value="0x001B8000" />
+        <register type="NOA" address="0x00009888" value="0x021BC000" />
+        <register type="NOA" address="0x00009888" value="0x001C0041" />
+        <register type="NOA" address="0x00009888" value="0x061C4200" />
+        <register type="NOA" address="0x00009888" value="0x081C4443" />
+        <register type="NOA" address="0x00009888" value="0x0A1C4645" />
+        <register type="NOA" address="0x00009888" value="0x0C1C7647" />
+        <register type="NOA" address="0x00009888" value="0x041C7357" />
+        <register type="NOA" address="0x00009888" value="0x1C1C0030" />
+        <register type="NOA" address="0x00009888" value="0x101C0000" />
+        <register type="NOA" address="0x00009888" value="0x1A1C0000" />
+        <register type="NOA" address="0x00009888" value="0x121C8000" />
+        <register type="NOA" address="0x00009888" value="0x004C8000" />
+        <register type="NOA" address="0x00009888" value="0x0A4CAA2A" />
+        <register type="NOA" address="0x00009888" value="0x0C4C02AA" />
+        <register type="NOA" address="0x00009888" value="0x084CA000" />
+        <register type="NOA" address="0x00009888" value="0x000DA000" />
+        <register type="NOA" address="0x00009888" value="0x060D8000" />
+        <register type="NOA" address="0x00009888" value="0x080DA000" />
+        <register type="NOA" address="0x00009888" value="0x0A0DA000" />
+        <register type="NOA" address="0x00009888" value="0x0C0DA000" />
+        <register type="NOA" address="0x00009888" value="0x0E0DA000" />
+        <register type="NOA" address="0x00009888" value="0x020DA000" />
+        <register type="NOA" address="0x00009888" value="0x040DA000" />
+        <register type="NOA" address="0x00009888" value="0x0C0F5400" />
+        <register type="NOA" address="0x00009888" value="0x0E0F5515" />
+        <register type="NOA" address="0x00009888" value="0x100F0155" />
+        <register type="NOA" address="0x00009888" value="0x002C8000" />
+        <register type="NOA" address="0x00009888" value="0x0E2C8000" />
+        <register type="NOA" address="0x00009888" value="0x162CAA00" />
+        <register type="NOA" address="0x00009888" value="0x182C00AA" />
+        <register type="NOA" address="0x00009888" value="0x022C8000" />
+        <register type="NOA" address="0x00009888" value="0x042C8000" />
+        <register type="NOA" address="0x00009888" value="0x062C8000" />
+        <register type="NOA" address="0x00009888" value="0x082C8000" />
+        <register type="NOA" address="0x00009888" value="0x0A2C8000" />
+        <register type="NOA" address="0x00009888" value="0x11907FFF" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x41900040" />
+        <register type="NOA" address="0x00009888" value="0x55900000" />
+        <register type="NOA" address="0x00009888" value="0x45900802" />
+        <register type="NOA" address="0x00009888" value="0x47900842" />
+        <register type="NOA" address="0x00009888" value="0x57900000" />
+        <register type="NOA" address="0x00009888" value="0x49900842" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+        <register type="NOA" address="0x00009888" value="0x4B900000" />
+        <register type="NOA" address="0x00009888" value="0x59900000" />
+        <register type="NOA" address="0x00009888" value="0x43900800" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002724" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002770" value="0x0007FC2A" />
+        <register type="OA" address="0x00002774" value="0x0000BF00" />
+        <register type="OA" address="0x00002778" value="0x0007FC6A" />
+        <register type="OA" address="0x0000277C" value="0x0000BF00" />
+        <register type="OA" address="0x00002780" value="0x0007FC92" />
+        <register type="OA" address="0x00002784" value="0x0000BF00" />
+        <register type="OA" address="0x00002788" value="0x0007FCA2" />
+        <register type="OA" address="0x0000278C" value="0x0000BF00" />
+        <register type="OA" address="0x00002790" value="0x0007FC32" />
+        <register type="OA" address="0x00002794" value="0x0000BF00" />
+        <register type="OA" address="0x00002798" value="0x0007FC9A" />
+        <register type="OA" address="0x0000279C" value="0x0000BF00" />
+        <register type="OA" address="0x000027A0" value="0x0007FE6A" />
+        <register type="OA" address="0x000027A4" value="0x0000BF00" />
+        <register type="OA" address="0x000027A8" value="0x0007FE7A" />
+        <register type="OA" address="0x000027AC" value="0x0000BF00" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00000003" />
+        <register type="FLEX" address="0x0000E658" value="0x00002001" />
+        <register type="FLEX" address="0x0000E758" value="0x00778008" />
+        <register type="FLEX" address="0x0000E45C" value="0x00088078" />
+        <register type="FLEX" address="0x0000E55C" value="0x00808708" />
+        <register type="FLEX" address="0x0000E65C" value="0x00A08908" />
+    </register_config>
+  </set>
+
+  <set name="Compute Metrics L3 Cache Gen9"
+       mdapi_supported_apis="VK OGL4 OCL IO BB"
+       underscore_name="compute_l3_cache"
+       hw_config_guid="4389cf07-1424-4963-b2d2-64fcec75406d"
+       chipset="CFLGT2"
+       symbol_name="ComputeL3Cache"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Bank 03 Accesses"
+             description="The total number of accesses to L3 Bank 03."
+             data_type="uint64"
+             equation="B 3 READ 2 UMUL"
+             underscore_name="l3_bank03_accesses"
+             units="messages"
+             symbol_name="L3Bank03Accesses"
+             availability="$SliceMask 0x01 AND"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="slice"
+             mdapi_group="L3"
+             />
+    <counter name="L3 Accesses"
+             description="The total number of L3 accesses from all entities."
+             data_type="uint64"
+             equation="C 0 READ C 1 READ B 2 READ B 3 READ UADD UADD UADD 2 UMUL"
+             underscore_name="l3_accesses"
+             units="messages"
+             symbol_name="L3Accesses"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Sampler Throughput"
+             description="The total number of GPU memory bytes transferred between samplers and L3 caches."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="A 29 READ 64 UMUL"
+             underscore_name="l3_sampler_throughput"
+             units="bytes"
+             symbol_name="L3SamplerThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Sampler"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="fpu0_active"
+             units="percent"
+             symbol_name="Fpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="fpu1_active"
+             units="percent"
+             symbol_name="Fpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU AVG IPC Rate"
+             description="The average rate of IPC calculated for 2 FPU pipelines."
+             data_type="float"
+             max_equation="2"
+             equation="A 9 READ  A 10 READ  A 11 READ UADD  A 9 READ USUB FDIV 1 FADD"
+             underscore_name="eu_avg_ipc_rate"
+             units="number"
+             symbol_name="EuAvgIpcRate"
+             semantic_type="ratio"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier4 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU0 Binary Instruction"
+             description="The percentage of time in which execution units were actively processing binary instructions on FPU0."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_binary_fpu0_instruction"
+             units="percent"
+             symbol_name="EuBinaryFpu0Instruction"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes/Instructions"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="EU FPU0 Hybrid Instruction"
+             description="The percentage of time in which execution units were actively processing hybrid instructions on FPU0."
+             data_type="float"
+             max_equation="100"
+             equation="A 13 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_hybrid_fpu0_instruction"
+             units="percent"
+             symbol_name="EuHybridFpu0Instruction"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="EU Array/Pipes/Instructions"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Misses"
+             description="The total number of L3 misses."
+             data_type="uint64"
+             equation="C 4 READ C 5 READ UADD"
+             underscore_name="l3_misses"
+             units="messages"
+             symbol_name="L3Misses"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/TAG"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="L3 Bank 00 Accesses"
+             description="The total number of accesses to L3 Bank 00."
+             data_type="uint64"
+             equation="C 0 READ 2 UMUL"
+             underscore_name="l3_bank00_accesses"
+             units="messages"
+             symbol_name="L3Bank00Accesses"
+             availability="$SliceMask 0x01 AND"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="slice"
+             mdapi_group="L3"
+             />
+    <counter name="EU FPU0 Move Instruction"
+             description="The percentage of time in which execution units were actively processing move instructions on FPU0."
+             data_type="float"
+             max_equation="100"
+             equation="A 19 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_move_fpu0_instruction"
+             units="percent"
+             symbol_name="EuMoveFpu0Instruction"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes/Instructions"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU FPU1 Hybrid Instruction"
+             description="The percentage of time in which execution units were actively processing hybrid instructions on FPU1."
+             data_type="float"
+             max_equation="100"
+             equation="A 14 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_hybrid_fpu1_instruction"
+             units="percent"
+             symbol_name="EuHybridFpu1Instruction"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="EU Array/Pipes/Instructions"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texel lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GTI Read Throughput"
+             description="The total number of GPU memory bytes read from GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL"
+             equation="C 6 READ 64 UMUL"
+             underscore_name="gti_read_throughput"
+             units="bytes"
+             symbol_name="GtiReadThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GTI L3 Throughput"
+             description="The total number of GPU memory bytes transferred between L3 caches and GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="C 4 READ C 5 READ UADD 64 UMUL"
+             underscore_name="gti_l3_throughput"
+             units="bytes"
+             symbol_name="GtiL3Throughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Bank 00 IC Accesses"
+             description="The total number of accesses to L3 Bank 00 from IC cache."
+             data_type="uint64"
+             equation="B 0 READ B 1 READ UADD 2 UMUL $L3Bank00Accesses UMIN"
+             underscore_name="l3_bank00_ic_accesses"
+             units="messages"
+             symbol_name="L3Bank00IcAccesses"
+             availability="$SliceMask 0x01 AND"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="slice"
+             mdapi_group="L3/IC"
+             />
+    <counter name="L3 Bank 00 IC Hits"
+             description="The total number of hits in L3 Bank 00 from IC cache."
+             data_type="uint64"
+             equation="B 1 READ 2 UMUL $L3Bank00IcAccesses UMIN"
+             underscore_name="l3_bank00_ic_hits"
+             units="messages"
+             symbol_name="L3Bank00IcHits"
+             availability="$SliceMask 0x01 AND"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="slice"
+             mdapi_group="L3/IC"
+             />
+    <counter name="Sampler Accesses"
+             description="The total number of messages sent to samplers."
+             data_type="uint64"
+             equation="A 28 READ"
+             underscore_name="sampler_accesses"
+             units="messages"
+             symbol_name="SamplerAccesses"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler"
+             />
+    <counter name="L3 Bank 01 Accesses"
+             description="The total number of accesses to L3 Bank 01."
+             data_type="uint64"
+             equation="C 1 READ 2 UMUL"
+             underscore_name="l3_bank01_accesses"
+             units="messages"
+             symbol_name="L3Bank01Accesses"
+             availability="$SliceMask 0x01 AND"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="slice"
+             mdapi_group="L3"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU0 Ternary Instruction"
+             description="The percentage of time in which execution units were actively processing ternary instructions on FPU0."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_ternary_fpu0_instruction"
+             units="percent"
+             symbol_name="EuTernaryFpu0Instruction"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes/Instructions"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU FPU1 Move Instruction"
+             description="The percentage of time in which execution units were actively processing move instructions on FPU1."
+             data_type="float"
+             max_equation="100"
+             equation="A 20 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_move_fpu1_instruction"
+             units="percent"
+             symbol_name="EuMoveFpu1Instruction"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes/Instructions"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="L3 Bank 02 Accesses"
+             description="The total number of accesses to L3 Bank 02."
+             data_type="uint64"
+             equation="B 2 READ 2 UMUL"
+             underscore_name="l3_bank02_accesses"
+             units="messages"
+             symbol_name="L3Bank02Accesses"
+             availability="$SliceMask 0x01 AND"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="slice"
+             mdapi_group="L3"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="L3 Total Throughput"
+             description="The total number of GPU memory bytes transferred via L3."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="$L3Accesses 64 UMUL"
+             underscore_name="l3_total_throughput"
+             units="bytes"
+             symbol_name="L3TotalThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GTI Write Throughput"
+             description="The total number of GPU memory bytes written to GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 32 UMUL"
+             equation="C 7 READ 64 UMUL"
+             underscore_name="gti_write_throughput"
+             units="bytes"
+             symbol_name="GtiWriteThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="EU FPU1 Binary Instruction"
+             description="The percentage of time in which execution units were actively processing binary instructions on FPU1."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_binary_fpu1_instruction"
+             units="percent"
+             symbol_name="EuBinaryFpu1Instruction"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes/Instructions"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU1 Ternary Instruction"
+             description="The percentage of time in which execution units were actively processing ternary instructions on FPU1."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_ternary_fpu1_instruction"
+             units="percent"
+             symbol_name="EuTernaryFpu1Instruction"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes/Instructions"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_send_active"
+             units="percent"
+             symbol_name="EuSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x166C0760" />
+        <register type="NOA" address="0x00009888" value="0x1593001E" />
+        <register type="NOA" address="0x00009888" value="0x3F900003" />
+        <register type="NOA" address="0x00009888" value="0x004E8000" />
+        <register type="NOA" address="0x00009888" value="0x0E4E8000" />
+        <register type="NOA" address="0x00009888" value="0x184E8000" />
+        <register type="NOA" address="0x00009888" value="0x1A4E8020" />
+        <register type="NOA" address="0x00009888" value="0x1C4E0002" />
+        <register type="NOA" address="0x00009888" value="0x006C0051" />
+        <register type="NOA" address="0x00009888" value="0x066C5000" />
+        <register type="NOA" address="0x00009888" value="0x086C5C5D" />
+        <register type="NOA" address="0x00009888" value="0x0E6C5E5F" />
+        <register type="NOA" address="0x00009888" value="0x106C0000" />
+        <register type="NOA" address="0x00009888" value="0x186C0000" />
+        <register type="NOA" address="0x00009888" value="0x1C6C0000" />
+        <register type="NOA" address="0x00009888" value="0x1E6C0000" />
+        <register type="NOA" address="0x00009888" value="0x001B4000" />
+        <register type="NOA" address="0x00009888" value="0x061B8000" />
+        <register type="NOA" address="0x00009888" value="0x081BC000" />
+        <register type="NOA" address="0x00009888" value="0x0E1BC000" />
+        <register type="NOA" address="0x00009888" value="0x101C8000" />
+        <register type="NOA" address="0x00009888" value="0x1A1CE000" />
+        <register type="NOA" address="0x00009888" value="0x1C1C0030" />
+        <register type="NOA" address="0x00009888" value="0x004C8000" />
+        <register type="NOA" address="0x00009888" value="0x0A4C2A00" />
+        <register type="NOA" address="0x00009888" value="0x0C4C0280" />
+        <register type="NOA" address="0x00009888" value="0x000D2000" />
+        <register type="NOA" address="0x00009888" value="0x060D8000" />
+        <register type="NOA" address="0x00009888" value="0x080DA000" />
+        <register type="NOA" address="0x00009888" value="0x0E0DA000" />
+        <register type="NOA" address="0x00009888" value="0x0C0F0400" />
+        <register type="NOA" address="0x00009888" value="0x0E0F1500" />
+        <register type="NOA" address="0x00009888" value="0x100F0140" />
+        <register type="NOA" address="0x00009888" value="0x002C8000" />
+        <register type="NOA" address="0x00009888" value="0x0E2C8000" />
+        <register type="NOA" address="0x00009888" value="0x162C0A00" />
+        <register type="NOA" address="0x00009888" value="0x182C00A0" />
+        <register type="NOA" address="0x00009888" value="0x03933300" />
+        <register type="NOA" address="0x00009888" value="0x05930032" />
+        <register type="NOA" address="0x00009888" value="0x11930000" />
+        <register type="NOA" address="0x00009888" value="0x1B930000" />
+        <register type="NOA" address="0x00009888" value="0x1D900157" />
+        <register type="NOA" address="0x00009888" value="0x1F900158" />
+        <register type="NOA" address="0x00009888" value="0x35900000" />
+        <register type="NOA" address="0x00009888" value="0x19908000" />
+        <register type="NOA" address="0x00009888" value="0x1B908000" />
+        <register type="NOA" address="0x00009888" value="0x1190030F" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x41900000" />
+        <register type="NOA" address="0x00009888" value="0x55900000" />
+        <register type="NOA" address="0x00009888" value="0x45900021" />
+        <register type="NOA" address="0x00009888" value="0x47900000" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+        <register type="NOA" address="0x00009888" value="0x57900000" />
+        <register type="NOA" address="0x00009888" value="0x4B900000" />
+        <register type="NOA" address="0x00009888" value="0x59900000" />
+        <register type="NOA" address="0x00009888" value="0x53904444" />
+        <register type="NOA" address="0x00009888" value="0x43900000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x30800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x30800000" />
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002770" value="0x0007FFFA" />
+        <register type="OA" address="0x00002774" value="0x0000FEFE" />
+        <register type="OA" address="0x00002778" value="0x0007FFFA" />
+        <register type="OA" address="0x0000277C" value="0x0000FEFD" />
+        <register type="OA" address="0x00002790" value="0x0007FFFA" />
+        <register type="OA" address="0x00002794" value="0x0000FBEF" />
+        <register type="OA" address="0x00002798" value="0x0007FFFA" />
+        <register type="OA" address="0x0000279C" value="0x0000FBDF" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00000003" />
+        <register type="FLEX" address="0x0000E658" value="0x00002001" />
+        <register type="FLEX" address="0x0000E758" value="0x00101100" />
+        <register type="FLEX" address="0x0000E45C" value="0x00201200" />
+        <register type="FLEX" address="0x0000E55C" value="0x00301300" />
+        <register type="FLEX" address="0x0000E65C" value="0x00401400" />
+    </register_config>
+  </set>
+
+  <set name="Metric set HDCAndSF"
+       mdapi_supported_apis="VK OGL OCL IO BB"
+       underscore_name="hdc_and_sf"
+       hw_config_guid="ac544b3a-ff78-46ea-9808-ee6fef0978b4"
+       chipset="CFLGT2"
+       symbol_name="HDCAndSF"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SQ is full"
+             description="The percentage of time when SQ is filled above a threshold (usually 48 entries)"
+             data_type="float"
+             max_equation="100"
+             equation="PERFCNT1 READ_REG 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gt_request_queue_full"
+             units="percent"
+             symbol_name="GTRequestQueueFull"
+             availability="true $QueryMode &&"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL4 OCL"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were actively processed on both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="Polygon Data Ready"
+             description="The percentage of time in which geometry pipeline output is ready"
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="poly_data_ready"
+             units="percent"
+             symbol_name="PolyDataReady"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/3D Pipe/Strip-Fans"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texel lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="HDC stalled by L3 (s0.ss1)"
+             description="Percentage of time when HDC has messages to L3, but it's stalled due to lack of credits (s0.ss1)"
+             data_type="float"
+             max_equation="100"
+             equation="C 5 READ C 4 READ USUB 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="non_sampler_shader01_access_stalled_on_l3"
+             units="percent"
+             symbol_name="NonSamplerShader01AccessStalledOnL3"
+             availability="$SubsliceMask 0x2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="GPU/Data Port"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="HDC stalled by L3 (s0.ss2)"
+             description="Percentage of time when HDC has messages to L3, but it's stalled due to lack of credits (s0.ss2)"
+             data_type="float"
+             max_equation="100"
+             equation="C 3 READ C 2 READ USUB 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="non_sampler_shader02_access_stalled_on_l3"
+             units="percent"
+             symbol_name="NonSamplerShader02AccessStalledOnL3"
+             availability="$SubsliceMask 0x4 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="GPU/Data Port"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="HDC stalled by L3 (s0.ss0)"
+             description="Percentage of time when HDC has messages to L3, but it's stalled due to lack of credits (s0.ss0)"
+             data_type="float"
+             max_equation="100"
+             equation="C 7 READ C 6 READ USUB 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="non_sampler_shader00_access_stalled_on_l3"
+             units="percent"
+             symbol_name="NonSamplerShader00AccessStalledOnL3"
+             availability="$SubsliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="GPU/Data Port"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x000091BC" value="0xE0500000" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x104F0232" />
+        <register type="NOA" address="0x00009888" value="0x124F4640" />
+        <register type="NOA" address="0x00009888" value="0x106C0232" />
+        <register type="NOA" address="0x00009888" value="0x11834400" />
+        <register type="NOA" address="0x00009888" value="0x0A4E8000" />
+        <register type="NOA" address="0x00009888" value="0x0C4E8000" />
+        <register type="NOA" address="0x00009888" value="0x004F1880" />
+        <register type="NOA" address="0x00009888" value="0x024F08BB" />
+        <register type="NOA" address="0x00009888" value="0x044F001B" />
+        <register type="NOA" address="0x00009888" value="0x046C0100" />
+        <register type="NOA" address="0x00009888" value="0x066C000B" />
+        <register type="NOA" address="0x00009888" value="0x1A6C0000" />
+        <register type="NOA" address="0x00009888" value="0x041B8000" />
+        <register type="NOA" address="0x00009888" value="0x061B4000" />
+        <register type="NOA" address="0x00009888" value="0x1A1C1800" />
+        <register type="NOA" address="0x00009888" value="0x005B8000" />
+        <register type="NOA" address="0x00009888" value="0x025BC000" />
+        <register type="NOA" address="0x00009888" value="0x045B4000" />
+        <register type="NOA" address="0x00009888" value="0x125C8000" />
+        <register type="NOA" address="0x00009888" value="0x145C8000" />
+        <register type="NOA" address="0x00009888" value="0x165C8000" />
+        <register type="NOA" address="0x00009888" value="0x185C8000" />
+        <register type="NOA" address="0x00009888" value="0x0A4C00A0" />
+        <register type="NOA" address="0x00009888" value="0x000D8000" />
+        <register type="NOA" address="0x00009888" value="0x020DA000" />
+        <register type="NOA" address="0x00009888" value="0x040DA000" />
+        <register type="NOA" address="0x00009888" value="0x060D2000" />
+        <register type="NOA" address="0x00009888" value="0x0C0F5000" />
+        <register type="NOA" address="0x00009888" value="0x0E0F0055" />
+        <register type="NOA" address="0x00009888" value="0x022CC000" />
+        <register type="NOA" address="0x00009888" value="0x042CC000" />
+        <register type="NOA" address="0x00009888" value="0x062CC000" />
+        <register type="NOA" address="0x00009888" value="0x082CC000" />
+        <register type="NOA" address="0x00009888" value="0x0A2C8000" />
+        <register type="NOA" address="0x00009888" value="0x0C2C8000" />
+        <register type="NOA" address="0x00009888" value="0x0F828000" />
+        <register type="NOA" address="0x00009888" value="0x0F8305C0" />
+        <register type="NOA" address="0x00009888" value="0x09830000" />
+        <register type="NOA" address="0x00009888" value="0x07830000" />
+        <register type="NOA" address="0x00009888" value="0x1D950080" />
+        <register type="NOA" address="0x00009888" value="0x13928000" />
+        <register type="NOA" address="0x00009888" value="0x0F988000" />
+        <register type="NOA" address="0x00009888" value="0x31904000" />
+        <register type="NOA" address="0x00009888" value="0x1190FC00" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x59900000" />
+        <register type="NOA" address="0x00009888" value="0x4B900040" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x41900800" />
+        <register type="NOA" address="0x00009888" value="0x43900842" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+        <register type="NOA" address="0x00009888" value="0x45900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002744" value="0x00800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x10800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+        <register type="OA" address="0x00002770" value="0x00000002" />
+        <register type="OA" address="0x00002774" value="0x0000FDFF" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E758" value="0x00015014" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+        <register type="FLEX" address="0x0000E65C" value="0x00055054" />
+    </register_config>
+  </set>
+
+  <set name="Metric set L3_1"
+       mdapi_supported_apis="VK OGL OCL IO BB"
+       underscore_name="l3_1"
+       hw_config_guid="a35c5867-0ab8-4d45-8fc1-eb0906f0eff5"
+       chipset="CFLGT2"
+       symbol_name="L3_1"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 L3 Bank1 Active"
+             description="The percentage of time in which slice0 L3 bank1 is active"
+             data_type="float"
+             max_equation="100"
+             equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l30_bank1_active"
+             units="percent"
+             symbol_name="L30Bank1Active"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SQ is full"
+             description="The percentage of time when SQ is filled above a threshold (usually 48 entries)"
+             data_type="float"
+             max_equation="100"
+             equation="PERFCNT1 READ_REG 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gt_request_queue_full"
+             units="percent"
+             symbol_name="GTRequestQueueFull"
+             availability="true $QueryMode &&"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL4 OCL"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were actively processed on both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="Slice0 L3 Bank1 Stalled"
+             description="The percentage of time in which slice0 L3 bank1 is stalled"
+             data_type="float"
+             max_equation="100"
+             equation="B 4 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l30_bank1_stalled"
+             units="percent"
+             symbol_name="L30Bank1Stalled"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texel lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 L3 Bank0 Active"
+             description="The percentage of time in which slice0 L3 bank0 is active"
+             data_type="float"
+             max_equation="100"
+             equation="C 6 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l30_bank0_active"
+             units="percent"
+             symbol_name="L30Bank0Active"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 L3 Bank0 Stalled"
+             description="The percentage of time in which slice0 L3 bank0 is stalled"
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l30_bank0_stalled"
+             units="percent"
+             symbol_name="L30Bank0Stalled"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x000091BC" value="0xE0500000" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x126C7B40" />
+        <register type="NOA" address="0x00009888" value="0x166C0020" />
+        <register type="NOA" address="0x00009888" value="0x0A603444" />
+        <register type="NOA" address="0x00009888" value="0x0A613400" />
+        <register type="NOA" address="0x00009888" value="0x1A4EA800" />
+        <register type="NOA" address="0x00009888" value="0x1C4E0002" />
+        <register type="NOA" address="0x00009888" value="0x024E8000" />
+        <register type="NOA" address="0x00009888" value="0x044E8000" />
+        <register type="NOA" address="0x00009888" value="0x064E8000" />
+        <register type="NOA" address="0x00009888" value="0x084E8000" />
+        <register type="NOA" address="0x00009888" value="0x0A4E8000" />
+        <register type="NOA" address="0x00009888" value="0x064F4000" />
+        <register type="NOA" address="0x00009888" value="0x0C6C5327" />
+        <register type="NOA" address="0x00009888" value="0x0E6C5425" />
+        <register type="NOA" address="0x00009888" value="0x006C2A00" />
+        <register type="NOA" address="0x00009888" value="0x026C285B" />
+        <register type="NOA" address="0x00009888" value="0x046C005C" />
+        <register type="NOA" address="0x00009888" value="0x106C0000" />
+        <register type="NOA" address="0x00009888" value="0x1C6C0000" />
+        <register type="NOA" address="0x00009888" value="0x1E6C0000" />
+        <register type="NOA" address="0x00009888" value="0x1A6C0800" />
+        <register type="NOA" address="0x00009888" value="0x0C1BC000" />
+        <register type="NOA" address="0x00009888" value="0x0E1BC000" />
+        <register type="NOA" address="0x00009888" value="0x001B8000" />
+        <register type="NOA" address="0x00009888" value="0x021BC000" />
+        <register type="NOA" address="0x00009888" value="0x041BC000" />
+        <register type="NOA" address="0x00009888" value="0x1C1C003C" />
+        <register type="NOA" address="0x00009888" value="0x121C8000" />
+        <register type="NOA" address="0x00009888" value="0x141C8000" />
+        <register type="NOA" address="0x00009888" value="0x161C8000" />
+        <register type="NOA" address="0x00009888" value="0x181C8000" />
+        <register type="NOA" address="0x00009888" value="0x1A1C0800" />
+        <register type="NOA" address="0x00009888" value="0x065B4000" />
+        <register type="NOA" address="0x00009888" value="0x1A5C1000" />
+        <register type="NOA" address="0x00009888" value="0x10600000" />
+        <register type="NOA" address="0x00009888" value="0x04600000" />
+        <register type="NOA" address="0x00009888" value="0x0C610044" />
+        <register type="NOA" address="0x00009888" value="0x10610000" />
+        <register type="NOA" address="0x00009888" value="0x06610000" />
+        <register type="NOA" address="0x00009888" value="0x0C4C02A8" />
+        <register type="NOA" address="0x00009888" value="0x084CA000" />
+        <register type="NOA" address="0x00009888" value="0x0A4C002A" />
+        <register type="NOA" address="0x00009888" value="0x0C0DA000" />
+        <register type="NOA" address="0x00009888" value="0x0E0DA000" />
+        <register type="NOA" address="0x00009888" value="0x000D8000" />
+        <register type="NOA" address="0x00009888" value="0x020DA000" />
+        <register type="NOA" address="0x00009888" value="0x040DA000" />
+        <register type="NOA" address="0x00009888" value="0x060D2000" />
+        <register type="NOA" address="0x00009888" value="0x100F0154" />
+        <register type="NOA" address="0x00009888" value="0x0C0F5000" />
+        <register type="NOA" address="0x00009888" value="0x0E0F0055" />
+        <register type="NOA" address="0x00009888" value="0x182C00AA" />
+        <register type="NOA" address="0x00009888" value="0x022C8000" />
+        <register type="NOA" address="0x00009888" value="0x042C8000" />
+        <register type="NOA" address="0x00009888" value="0x062C8000" />
+        <register type="NOA" address="0x00009888" value="0x082C8000" />
+        <register type="NOA" address="0x00009888" value="0x0A2C8000" />
+        <register type="NOA" address="0x00009888" value="0x0C2CC000" />
+        <register type="NOA" address="0x00009888" value="0x1190FFC0" />
+        <register type="NOA" address="0x00009888" value="0x57900000" />
+        <register type="NOA" address="0x00009888" value="0x49900420" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+        <register type="NOA" address="0x00009888" value="0x4B900021" />
+        <register type="NOA" address="0x00009888" value="0x59900000" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x41900400" />
+        <register type="NOA" address="0x00009888" value="0x43900421" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+        <register type="NOA" address="0x00009888" value="0x45900040" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002744" value="0x00800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0xF0800000" />
+        <register type="OA" address="0x00002770" value="0x00100070" />
+        <register type="OA" address="0x00002774" value="0x0000FFF1" />
+        <register type="OA" address="0x00002778" value="0x00014002" />
+        <register type="OA" address="0x0000277C" value="0x0000C3FF" />
+        <register type="OA" address="0x00002780" value="0x00010002" />
+        <register type="OA" address="0x00002784" value="0x0000C7FF" />
+        <register type="OA" address="0x00002788" value="0x00004002" />
+        <register type="OA" address="0x0000278C" value="0x0000D3FF" />
+        <register type="OA" address="0x00002790" value="0x00100700" />
+        <register type="OA" address="0x00002794" value="0x0000FF1F" />
+        <register type="OA" address="0x00002798" value="0x00001402" />
+        <register type="OA" address="0x0000279C" value="0x0000FC3F" />
+        <register type="OA" address="0x000027A0" value="0x00001002" />
+        <register type="OA" address="0x000027A4" value="0x0000FC7F" />
+        <register type="OA" address="0x000027A8" value="0x00000402" />
+        <register type="OA" address="0x000027AC" value="0x0000FD3F" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E758" value="0x00015014" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+        <register type="FLEX" address="0x0000E65C" value="0x00055054" />
+    </register_config>
+  </set>
+
+  <set name="Metric set L3_2"
+       mdapi_supported_apis="VK OGL OCL IO BB"
+       underscore_name="l3_2"
+       hw_config_guid="bb4bcce9-2cbb-4818-9e49-67ce2c99cd25"
+       chipset="CFLGT2"
+       symbol_name="L3_2"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SQ is full"
+             description="The percentage of time when SQ is filled above a threshold (usually 48 entries)"
+             data_type="float"
+             max_equation="100"
+             equation="PERFCNT1 READ_REG 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gt_request_queue_full"
+             units="percent"
+             symbol_name="GTRequestQueueFull"
+             availability="true $QueryMode &&"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL4 OCL"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on the both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 L3 Bank2 Stalled"
+             description="The percentage of time in which slice0 L3 bank2 is stalled"
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l30_bank2_stalled"
+             units="percent"
+             symbol_name="L30Bank2Stalled"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 L3 Bank2 Active"
+             description="The percentage of time in which slice0 L3 bank2 is active"
+             data_type="float"
+             max_equation="100"
+             equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l30_bank2_active"
+             units="percent"
+             symbol_name="L30Bank2Active"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x000091BC" value="0xE0500000" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x126C02E0" />
+        <register type="NOA" address="0x00009888" value="0x146C0001" />
+        <register type="NOA" address="0x00009888" value="0x0A623400" />
+        <register type="NOA" address="0x00009888" value="0x044E8000" />
+        <register type="NOA" address="0x00009888" value="0x064E8000" />
+        <register type="NOA" address="0x00009888" value="0x084E8000" />
+        <register type="NOA" address="0x00009888" value="0x0A4E8000" />
+        <register type="NOA" address="0x00009888" value="0x064F4000" />
+        <register type="NOA" address="0x00009888" value="0x026C3324" />
+        <register type="NOA" address="0x00009888" value="0x046C3422" />
+        <register type="NOA" address="0x00009888" value="0x106C0000" />
+        <register type="NOA" address="0x00009888" value="0x1A6C0000" />
+        <register type="NOA" address="0x00009888" value="0x021BC000" />
+        <register type="NOA" address="0x00009888" value="0x041BC000" />
+        <register type="NOA" address="0x00009888" value="0x141C8000" />
+        <register type="NOA" address="0x00009888" value="0x161C8000" />
+        <register type="NOA" address="0x00009888" value="0x181C8000" />
+        <register type="NOA" address="0x00009888" value="0x1A1C0800" />
+        <register type="NOA" address="0x00009888" value="0x065B4000" />
+        <register type="NOA" address="0x00009888" value="0x1A5C1000" />
+        <register type="NOA" address="0x00009888" value="0x06614000" />
+        <register type="NOA" address="0x00009888" value="0x0C620044" />
+        <register type="NOA" address="0x00009888" value="0x10620000" />
+        <register type="NOA" address="0x00009888" value="0x06620000" />
+        <register type="NOA" address="0x00009888" value="0x084C8000" />
+        <register type="NOA" address="0x00009888" value="0x0A4C002A" />
+        <register type="NOA" address="0x00009888" value="0x020DA000" />
+        <register type="NOA" address="0x00009888" value="0x040DA000" />
+        <register type="NOA" address="0x00009888" value="0x060D2000" />
+        <register type="NOA" address="0x00009888" value="0x0C0F4000" />
+        <register type="NOA" address="0x00009888" value="0x0E0F0055" />
+        <register type="NOA" address="0x00009888" value="0x042C8000" />
+        <register type="NOA" address="0x00009888" value="0x062C8000" />
+        <register type="NOA" address="0x00009888" value="0x082C8000" />
+        <register type="NOA" address="0x00009888" value="0x0A2C8000" />
+        <register type="NOA" address="0x00009888" value="0x0C2CC000" />
+        <register type="NOA" address="0x00009888" value="0x1190F800" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x43900000" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+        <register type="NOA" address="0x00009888" value="0x45900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002744" value="0x00800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+        <register type="OA" address="0x00002770" value="0x00100070" />
+        <register type="OA" address="0x00002774" value="0x0000FFF1" />
+        <register type="OA" address="0x00002778" value="0x00028002" />
+        <register type="OA" address="0x0000277C" value="0x000087FF" />
+        <register type="OA" address="0x00002780" value="0x00020002" />
+        <register type="OA" address="0x00002784" value="0x00008FFF" />
+        <register type="OA" address="0x00002788" value="0x00008002" />
+        <register type="OA" address="0x0000278C" value="0x0000A7FF" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E758" value="0x00015014" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+        <register type="FLEX" address="0x0000E65C" value="0x00055054" />
+    </register_config>
+  </set>
+
+  <set name="Metric set L3_3"
+       mdapi_supported_apis="VK OGL OCL IO BB"
+       underscore_name="l3_3"
+       hw_config_guid="9e1229f8-d87f-4f44-b067-3544e17195aa"
+       chipset="CFLGT2"
+       symbol_name="L3_3"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SQ is full"
+             description="The percentage of time when SQ is filled above a threshold (usually 48 entries)"
+             data_type="float"
+             max_equation="100"
+             equation="PERFCNT1 READ_REG 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gt_request_queue_full"
+             units="percent"
+             symbol_name="GTRequestQueueFull"
+             availability="true $QueryMode &&"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL4 OCL"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on the both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Slice0 L3 Bank3 Stalled"
+             description="The percentage of time in which slice0 L3 bank3 is stalled"
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l30_bank3_stalled"
+             units="percent"
+             symbol_name="L30Bank3Stalled"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 L3 Bank3 Active"
+             description="The percentage of time in which slice0 L3 bank3 is active"
+             data_type="float"
+             max_equation="100"
+             equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l30_bank3_active"
+             units="percent"
+             symbol_name="L30Bank3Active"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x000091BC" value="0xE0500000" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x126C4E80" />
+        <register type="NOA" address="0x00009888" value="0x146C0000" />
+        <register type="NOA" address="0x00009888" value="0x0A633400" />
+        <register type="NOA" address="0x00009888" value="0x044E8000" />
+        <register type="NOA" address="0x00009888" value="0x064E8000" />
+        <register type="NOA" address="0x00009888" value="0x084E8000" />
+        <register type="NOA" address="0x00009888" value="0x0A4E8000" />
+        <register type="NOA" address="0x00009888" value="0x0C4E8000" />
+        <register type="NOA" address="0x00009888" value="0x026C3321" />
+        <register type="NOA" address="0x00009888" value="0x046C342F" />
+        <register type="NOA" address="0x00009888" value="0x106C0000" />
+        <register type="NOA" address="0x00009888" value="0x1A6C2000" />
+        <register type="NOA" address="0x00009888" value="0x021BC000" />
+        <register type="NOA" address="0x00009888" value="0x041BC000" />
+        <register type="NOA" address="0x00009888" value="0x061B4000" />
+        <register type="NOA" address="0x00009888" value="0x141C8000" />
+        <register type="NOA" address="0x00009888" value="0x161C8000" />
+        <register type="NOA" address="0x00009888" value="0x181C8000" />
+        <register type="NOA" address="0x00009888" value="0x1A1C1800" />
+        <register type="NOA" address="0x00009888" value="0x06604000" />
+        <register type="NOA" address="0x00009888" value="0x0C630044" />
+        <register type="NOA" address="0x00009888" value="0x10630000" />
+        <register type="NOA" address="0x00009888" value="0x06630000" />
+        <register type="NOA" address="0x00009888" value="0x084C8000" />
+        <register type="NOA" address="0x00009888" value="0x0A4C00AA" />
+        <register type="NOA" address="0x00009888" value="0x020DA000" />
+        <register type="NOA" address="0x00009888" value="0x040DA000" />
+        <register type="NOA" address="0x00009888" value="0x060D2000" />
+        <register type="NOA" address="0x00009888" value="0x0C0F4000" />
+        <register type="NOA" address="0x00009888" value="0x0E0F0055" />
+        <register type="NOA" address="0x00009888" value="0x042C8000" />
+        <register type="NOA" address="0x00009888" value="0x062C8000" />
+        <register type="NOA" address="0x00009888" value="0x082C8000" />
+        <register type="NOA" address="0x00009888" value="0x0A2C8000" />
+        <register type="NOA" address="0x00009888" value="0x0C2C8000" />
+        <register type="NOA" address="0x00009888" value="0x1190F800" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x43900842" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+        <register type="NOA" address="0x00009888" value="0x45900002" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002744" value="0x00800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+        <register type="OA" address="0x00002770" value="0x00100070" />
+        <register type="OA" address="0x00002774" value="0x0000FFF1" />
+        <register type="OA" address="0x00002778" value="0x00028002" />
+        <register type="OA" address="0x0000277C" value="0x000087FF" />
+        <register type="OA" address="0x00002780" value="0x00020002" />
+        <register type="OA" address="0x00002784" value="0x00008FFF" />
+        <register type="OA" address="0x00002788" value="0x00008002" />
+        <register type="OA" address="0x0000278C" value="0x0000A7FF" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E758" value="0x00015014" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+        <register type="FLEX" address="0x0000E65C" value="0x00055054" />
+    </register_config>
+  </set>
+
+  <set name="Metric set RasterizerAndPixelBackend"
+       mdapi_supported_apis="VK OGL OCL IO BB"
+       underscore_name="rasterizer_and_pixel_backend"
+       hw_config_guid="3e91908a-1c70-4004-b2ab-a10ef14f24f9"
+       chipset="CFLGT2"
+       symbol_name="RasterizerAndPixelBackend"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SQ is full"
+             description="The percentage of time when SQ is filled above a threshold (usually 48 entries)"
+             data_type="float"
+             max_equation="100"
+             equation="PERFCNT1 READ_REG 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gt_request_queue_full"
+             units="percent"
+             symbol_name="GTRequestQueueFull"
+             availability="true $QueryMode &&"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL4 OCL"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Slice0 Pixel Values Ready"
+             description="The percentage of time in which slice0 pixel values are ready"
+             data_type="float"
+             max_equation="100"
+             equation="C 6 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="pixel_values0_ready"
+             units="percent"
+             symbol_name="PixelValues0Ready"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/3D Pipe"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texel lookups (with 2x2 accuracy) that missed the L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="Slice0 Rasterizer Input Available"
+             description="The percentage of time in which slice0 rasterizer input is available"
+             data_type="float"
+             max_equation="100"
+             equation="B 1 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="rasterizer0_input_available"
+             units="percent"
+             symbol_name="Rasterizer0InputAvailable"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Rasterizer"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Slice0 Post-EarlyZ Pixel Data Ready"
+             description="The percentage of time in which slice0 post-EarlyZ pixel data is ready (after early Z tests have been applied)"
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="pixel_data0_ready"
+             units="percent"
+             symbol_name="PixelData0Ready"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Rasterizer/Early Depth Test"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 Rasterizer Output Ready"
+             description="The percentage of time in which slice0 rasterizer output is ready"
+             data_type="float"
+             max_equation="100"
+             equation="C 5 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="rasterizer0_output_ready"
+             units="percent"
+             symbol_name="Rasterizer0OutputReady"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Rasterizer"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="Slice0 PS Output Available"
+             description="The percentage of time in which slice0 PS output is available"
+             data_type="float"
+             max_equation="100"
+             equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_output0_available"
+             units="percent"
+             symbol_name="PSOutput0Available"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/3D Pipe"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x000091BC" value="0xE0500000" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x102F3800" />
+        <register type="NOA" address="0x00009888" value="0x144D0500" />
+        <register type="NOA" address="0x00009888" value="0x120D03C0" />
+        <register type="NOA" address="0x00009888" value="0x140D03CF" />
+        <register type="NOA" address="0x00009888" value="0x0C0F0004" />
+        <register type="NOA" address="0x00009888" value="0x0C4E4000" />
+        <register type="NOA" address="0x00009888" value="0x042F0480" />
+        <register type="NOA" address="0x00009888" value="0x082F0000" />
+        <register type="NOA" address="0x00009888" value="0x022F0000" />
+        <register type="NOA" address="0x00009888" value="0x0A4C0090" />
+        <register type="NOA" address="0x00009888" value="0x064D0027" />
+        <register type="NOA" address="0x00009888" value="0x004D0000" />
+        <register type="NOA" address="0x00009888" value="0x000D0D40" />
+        <register type="NOA" address="0x00009888" value="0x020D803F" />
+        <register type="NOA" address="0x00009888" value="0x040D8023" />
+        <register type="NOA" address="0x00009888" value="0x100D0000" />
+        <register type="NOA" address="0x00009888" value="0x060D2000" />
+        <register type="NOA" address="0x00009888" value="0x020F0010" />
+        <register type="NOA" address="0x00009888" value="0x000F0000" />
+        <register type="NOA" address="0x00009888" value="0x0E0F0050" />
+        <register type="NOA" address="0x00009888" value="0x0A2C8000" />
+        <register type="NOA" address="0x00009888" value="0x0C2C8000" />
+        <register type="NOA" address="0x00009888" value="0x1190FC00" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x41901400" />
+        <register type="NOA" address="0x00009888" value="0x43901485" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+        <register type="NOA" address="0x00009888" value="0x45900001" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002744" value="0x00800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x30800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+        <register type="OA" address="0x00002770" value="0x00000002" />
+        <register type="OA" address="0x00002774" value="0x0000EFFF" />
+        <register type="OA" address="0x00002778" value="0x00006000" />
+        <register type="OA" address="0x0000277C" value="0x0000F3FF" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E758" value="0x00015014" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+        <register type="FLEX" address="0x0000E65C" value="0x00055054" />
+    </register_config>
+  </set>
+
+  <set name="Metric set Sampler"
+       mdapi_supported_apis="VK OGL OCL IO BB"
+       underscore_name="sampler"
+       hw_config_guid="9a6ba957-7955-4a09-a8ce-083030ba3c1f"
+       chipset="CFLGT2"
+       symbol_name="Sampler"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 Subslice2 Input Available"
+             description="The percentage of time in which slice0 subslice2 sampler input is available"
+             data_type="float"
+             max_equation="100"
+             equation="B 1 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler02_input_available"
+             units="percent"
+             symbol_name="Sampler02InputAvailable"
+             availability="$SubsliceMask 0x4 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SQ is full"
+             description="The percentage of time when SQ is filled above a threshold (usually 48 entries)"
+             data_type="float"
+             max_equation="100"
+             equation="PERFCNT1 READ_REG 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gt_request_queue_full"
+             units="percent"
+             symbol_name="GTRequestQueueFull"
+             availability="true $QueryMode &&"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL4 OCL"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 Subslice0 Input Available"
+             description="The percentage of time in which slice0 subslice0 sampler input is available"
+             data_type="float"
+             max_equation="100"
+             equation="B 2 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler00_input_available"
+             units="percent"
+             symbol_name="Sampler00InputAvailable"
+             availability="$SubsliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="Slice0 Subslice2 Sampler Output Ready"
+             description="The percentage of time in which slice0 subslice2 sampler output is ready"
+             data_type="float"
+             max_equation="100"
+             equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler02_output_ready"
+             units="percent"
+             symbol_name="Sampler02OutputReady"
+             availability="$SubsliceMask 0x4 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Slice0 Subslice1 Input Available"
+             description="The percentage of time in which slice0 subslice1 sampler input is available"
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler01_input_available"
+             units="percent"
+             symbol_name="Sampler01InputAvailable"
+             availability="$SubsliceMask 0x2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texel lookups (with 2x2 accuracy) that missed the L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Slice0 Subslice0 Sampler Output Ready"
+             description="The percentage of time in which slice0 subslice0 sampler output is ready"
+             data_type="float"
+             max_equation="100"
+             equation="C 6 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler00_output_ready"
+             units="percent"
+             symbol_name="Sampler00OutputReady"
+             availability="$SubsliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Slice0 Subslice1 Sampler Output Ready"
+             description="The percentage of time in which slice0 subslice1 sampler output is ready"
+             data_type="float"
+             max_equation="100"
+             equation="C 5 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler01_output_ready"
+             units="percent"
+             symbol_name="Sampler01OutputReady"
+             availability="$SubsliceMask 0x2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x000091BC" value="0xE0500000" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x14152C00" />
+        <register type="NOA" address="0x00009888" value="0x16150005" />
+        <register type="NOA" address="0x00009888" value="0x121600A0" />
+        <register type="NOA" address="0x00009888" value="0x14352C00" />
+        <register type="NOA" address="0x00009888" value="0x16350005" />
+        <register type="NOA" address="0x00009888" value="0x123600A0" />
+        <register type="NOA" address="0x00009888" value="0x14552C00" />
+        <register type="NOA" address="0x00009888" value="0x16550005" />
+        <register type="NOA" address="0x00009888" value="0x125600A0" />
+        <register type="NOA" address="0x00009888" value="0x062F6000" />
+        <register type="NOA" address="0x00009888" value="0x022F2000" />
+        <register type="NOA" address="0x00009888" value="0x0C4C0050" />
+        <register type="NOA" address="0x00009888" value="0x0A4C0010" />
+        <register type="NOA" address="0x00009888" value="0x0C0D8000" />
+        <register type="NOA" address="0x00009888" value="0x0E0DA000" />
+        <register type="NOA" address="0x00009888" value="0x000D8000" />
+        <register type="NOA" address="0x00009888" value="0x020DA000" />
+        <register type="NOA" address="0x00009888" value="0x040DA000" />
+        <register type="NOA" address="0x00009888" value="0x060D2000" />
+        <register type="NOA" address="0x00009888" value="0x100F0350" />
+        <register type="NOA" address="0x00009888" value="0x0C0FB000" />
+        <register type="NOA" address="0x00009888" value="0x0E0F00DA" />
+        <register type="NOA" address="0x00009888" value="0x182C0028" />
+        <register type="NOA" address="0x00009888" value="0x0A2C8000" />
+        <register type="NOA" address="0x00009888" value="0x022DC000" />
+        <register type="NOA" address="0x00009888" value="0x042D4000" />
+        <register type="NOA" address="0x00009888" value="0x0C138000" />
+        <register type="NOA" address="0x00009888" value="0x0E132000" />
+        <register type="NOA" address="0x00009888" value="0x0413C000" />
+        <register type="NOA" address="0x00009888" value="0x1C140018" />
+        <register type="NOA" address="0x00009888" value="0x0C157000" />
+        <register type="NOA" address="0x00009888" value="0x0E150078" />
+        <register type="NOA" address="0x00009888" value="0x10150000" />
+        <register type="NOA" address="0x00009888" value="0x04162180" />
+        <register type="NOA" address="0x00009888" value="0x02160000" />
+        <register type="NOA" address="0x00009888" value="0x04174000" />
+        <register type="NOA" address="0x00009888" value="0x0233A000" />
+        <register type="NOA" address="0x00009888" value="0x04333000" />
+        <register type="NOA" address="0x00009888" value="0x14348000" />
+        <register type="NOA" address="0x00009888" value="0x16348000" />
+        <register type="NOA" address="0x00009888" value="0x02357870" />
+        <register type="NOA" address="0x00009888" value="0x10350000" />
+        <register type="NOA" address="0x00009888" value="0x04360043" />
+        <register type="NOA" address="0x00009888" value="0x02360000" />
+        <register type="NOA" address="0x00009888" value="0x04371000" />
+        <register type="NOA" address="0x00009888" value="0x0E538000" />
+        <register type="NOA" address="0x00009888" value="0x00538000" />
+        <register type="NOA" address="0x00009888" value="0x06533000" />
+        <register type="NOA" address="0x00009888" value="0x1C540020" />
+        <register type="NOA" address="0x00009888" value="0x12548000" />
+        <register type="NOA" address="0x00009888" value="0x0E557000" />
+        <register type="NOA" address="0x00009888" value="0x00557800" />
+        <register type="NOA" address="0x00009888" value="0x10550000" />
+        <register type="NOA" address="0x00009888" value="0x06560043" />
+        <register type="NOA" address="0x00009888" value="0x02560000" />
+        <register type="NOA" address="0x00009888" value="0x06571000" />
+        <register type="NOA" address="0x00009888" value="0x1190FF80" />
+        <register type="NOA" address="0x00009888" value="0x57900000" />
+        <register type="NOA" address="0x00009888" value="0x49900000" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+        <register type="NOA" address="0x00009888" value="0x4B900060" />
+        <register type="NOA" address="0x00009888" value="0x59900000" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x41900C00" />
+        <register type="NOA" address="0x00009888" value="0x43900842" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+        <register type="NOA" address="0x00009888" value="0x45900060" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002744" value="0x00800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x70800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+        <register type="OA" address="0x00002770" value="0x0000C000" />
+        <register type="OA" address="0x00002774" value="0x0000E7FF" />
+        <register type="OA" address="0x00002778" value="0x00003000" />
+        <register type="OA" address="0x0000277C" value="0x0000F9FF" />
+        <register type="OA" address="0x00002780" value="0x00000C00" />
+        <register type="OA" address="0x00002784" value="0x0000FE7F" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E758" value="0x00015014" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+        <register type="FLEX" address="0x0000E65C" value="0x00055054" />
+    </register_config>
+  </set>
+
+  <set name="Metric set TDL_1"
+       mdapi_supported_apis="VK OGL OCL IO BB"
+       underscore_name="tdl_1"
+       hw_config_guid="c54e7ca3-c60c-4396-ac3d-f9899c9a6ee4"
+       chipset="CFLGT2"
+       symbol_name="TDL_1"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SQ is full"
+             description="The percentage of time when SQ is filled above a threshold (usually 48 entries)"
+             data_type="float"
+             max_equation="100"
+             equation="PERFCNT1 READ_REG 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gt_request_queue_full"
+             units="percent"
+             symbol_name="GTRequestQueueFull"
+             availability="true $QueryMode &&"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL4 OCL"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on the both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="NonPS Thread Ready For Dispatch on Slice0 Subslice2"
+             description="The percentage of time in which non-PS thread is ready for dispatch on slice0 subslice2 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="B 4 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="non_ps_thread02_ready_for_dispatch"
+             units="percent"
+             symbol_name="NonPSThread02ReadyForDispatch"
+             availability="$SubsliceMask 0x4 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="NonPS Thread Ready For Dispatch on Slice0 Subslice0"
+             description="The percentage of time in which non-PS thread is ready for dispatch on slice0 subslice0 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="B 2 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="non_ps_thread00_ready_for_dispatch"
+             units="percent"
+             symbol_name="NonPSThread00ReadyForDispatch"
+             availability="$SubsliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Thread Ready For Dispatch on Slice0 Subslice0"
+             description="The percentage of time in which PS thread is ready for dispatch on slice0 subslice0 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="B 1 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_thread00_ready_for_dispatch"
+             units="percent"
+             symbol_name="PSThread00ReadyForDispatch"
+             availability="$SubsliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="PS Thread Ready For Dispatch on Slice0 Subslice1"
+             description="The percentage of time in which PS thread is ready for dispatch on slice0 subslice1 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="B 5 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_thread01_ready_for_dispatch"
+             units="percent"
+             symbol_name="PSThread01ReadyForDispatch"
+             availability="$SubsliceMask 0x2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="PS Thread Ready For Dispatch on Slice0 Subslice2"
+             description="The percentage of time in which PS thread is ready for dispatch on slice0 subslice2 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="B 3 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_thread02_ready_for_dispatch"
+             units="percent"
+             symbol_name="PSThread02ReadyForDispatch"
+             availability="$SubsliceMask 0x4 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <counter name="NonPS Thread Ready For Dispatch on Slice0 Subslice1"
+             description="The percentage of time in which non-PS thread is ready for dispatch on slice0 subslice1 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="non_ps_thread01_ready_for_dispatch"
+             units="percent"
+             symbol_name="NonPSThread01ReadyForDispatch"
+             availability="$SubsliceMask 0x2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x000091BC" value="0xE0500000" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x12120000" />
+        <register type="NOA" address="0x00009888" value="0x12320000" />
+        <register type="NOA" address="0x00009888" value="0x12520000" />
+        <register type="NOA" address="0x00009888" value="0x002F8000" />
+        <register type="NOA" address="0x00009888" value="0x022F3000" />
+        <register type="NOA" address="0x00009888" value="0x0A4C0015" />
+        <register type="NOA" address="0x00009888" value="0x0C0D8000" />
+        <register type="NOA" address="0x00009888" value="0x0E0DA000" />
+        <register type="NOA" address="0x00009888" value="0x000D8000" />
+        <register type="NOA" address="0x00009888" value="0x020DA000" />
+        <register type="NOA" address="0x00009888" value="0x040DA000" />
+        <register type="NOA" address="0x00009888" value="0x060D2000" />
+        <register type="NOA" address="0x00009888" value="0x100F03A0" />
+        <register type="NOA" address="0x00009888" value="0x0C0FF000" />
+        <register type="NOA" address="0x00009888" value="0x0E0F0095" />
+        <register type="NOA" address="0x00009888" value="0x062C8000" />
+        <register type="NOA" address="0x00009888" value="0x082C8000" />
+        <register type="NOA" address="0x00009888" value="0x0A2C8000" />
+        <register type="NOA" address="0x00009888" value="0x0C2D8000" />
+        <register type="NOA" address="0x00009888" value="0x0E2D4000" />
+        <register type="NOA" address="0x00009888" value="0x062D4000" />
+        <register type="NOA" address="0x00009888" value="0x02108000" />
+        <register type="NOA" address="0x00009888" value="0x0410C000" />
+        <register type="NOA" address="0x00009888" value="0x02118000" />
+        <register type="NOA" address="0x00009888" value="0x0411C000" />
+        <register type="NOA" address="0x00009888" value="0x02121880" />
+        <register type="NOA" address="0x00009888" value="0x041219B5" />
+        <register type="NOA" address="0x00009888" value="0x00120000" />
+        <register type="NOA" address="0x00009888" value="0x02134000" />
+        <register type="NOA" address="0x00009888" value="0x04135000" />
+        <register type="NOA" address="0x00009888" value="0x0C308000" />
+        <register type="NOA" address="0x00009888" value="0x0E304000" />
+        <register type="NOA" address="0x00009888" value="0x06304000" />
+        <register type="NOA" address="0x00009888" value="0x0C318000" />
+        <register type="NOA" address="0x00009888" value="0x0E314000" />
+        <register type="NOA" address="0x00009888" value="0x06314000" />
+        <register type="NOA" address="0x00009888" value="0x0C321A80" />
+        <register type="NOA" address="0x00009888" value="0x0E320033" />
+        <register type="NOA" address="0x00009888" value="0x06320031" />
+        <register type="NOA" address="0x00009888" value="0x00320000" />
+        <register type="NOA" address="0x00009888" value="0x0C334000" />
+        <register type="NOA" address="0x00009888" value="0x0E331000" />
+        <register type="NOA" address="0x00009888" value="0x06331000" />
+        <register type="NOA" address="0x00009888" value="0x0E508000" />
+        <register type="NOA" address="0x00009888" value="0x00508000" />
+        <register type="NOA" address="0x00009888" value="0x02504000" />
+        <register type="NOA" address="0x00009888" value="0x0E518000" />
+        <register type="NOA" address="0x00009888" value="0x00518000" />
+        <register type="NOA" address="0x00009888" value="0x02514000" />
+        <register type="NOA" address="0x00009888" value="0x0E521880" />
+        <register type="NOA" address="0x00009888" value="0x00521A80" />
+        <register type="NOA" address="0x00009888" value="0x02520033" />
+        <register type="NOA" address="0x00009888" value="0x0E534000" />
+        <register type="NOA" address="0x00009888" value="0x00534000" />
+        <register type="NOA" address="0x00009888" value="0x02531000" />
+        <register type="NOA" address="0x00009888" value="0x1190FF80" />
+        <register type="NOA" address="0x00009888" value="0x57900000" />
+        <register type="NOA" address="0x00009888" value="0x49900800" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+        <register type="NOA" address="0x00009888" value="0x4B900062" />
+        <register type="NOA" address="0x00009888" value="0x59900000" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x41900C00" />
+        <register type="NOA" address="0x00009888" value="0x43900003" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+        <register type="NOA" address="0x00009888" value="0x45900040" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002744" value="0x00800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x30800000" />
+        <register type="OA" address="0x00002770" value="0x00000002" />
+        <register type="OA" address="0x00002774" value="0x00007FFF" />
+        <register type="OA" address="0x00002778" value="0x00000000" />
+        <register type="OA" address="0x0000277C" value="0x00009FFF" />
+        <register type="OA" address="0x00002780" value="0x00000002" />
+        <register type="OA" address="0x00002784" value="0x0000EFFF" />
+        <register type="OA" address="0x00002788" value="0x00000000" />
+        <register type="OA" address="0x0000278C" value="0x0000F3FF" />
+        <register type="OA" address="0x00002790" value="0x00000002" />
+        <register type="OA" address="0x00002794" value="0x0000FDFF" />
+        <register type="OA" address="0x00002798" value="0x00000000" />
+        <register type="OA" address="0x0000279C" value="0x0000FE7F" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E758" value="0x00015014" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+        <register type="FLEX" address="0x0000E65C" value="0x00055054" />
+    </register_config>
+  </set>
+
+  <set name="Metric set TDL_2"
+       mdapi_supported_apis="VK OGL OCL IO BB"
+       underscore_name="tdl_2"
+       hw_config_guid="e438cd5d-1da7-46c6-9823-4780f370d11d"
+       chipset="CFLGT2"
+       symbol_name="TDL_2"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SQ is full"
+             description="The percentage of time when SQ is filled above a threshold (usually 48 entries)"
+             data_type="float"
+             max_equation="100"
+             equation="PERFCNT1 READ_REG 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gt_request_queue_full"
+             units="percent"
+             symbol_name="GTRequestQueueFull"
+             availability="true $QueryMode &&"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL4 OCL"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on the both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Thread Header Ready on Slice0 Subslice1 Port 0"
+             description="The percentage of time in which thread header is ready on slice0 subslice1 thread dispatcher port 0"
+             data_type="float"
+             max_equation="100"
+             equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header01_ready_port0"
+             units="percent"
+             symbol_name="ThreadHeader01ReadyPort0"
+             availability="$SubsliceMask 0x2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Thread Header Ready on Slice0 Subslice1 Port 1"
+             description="The percentage of time in which thread header is ready on slice0 subslice1 thread dispatcher port 1"
+             data_type="float"
+             max_equation="100"
+             equation="C 2 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header01_ready_port1"
+             units="percent"
+             symbol_name="ThreadHeader01ReadyPort1"
+             availability="$SubsliceMask 0x2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Thread Header Ready on Slice0 Subslice2 Port 1"
+             description="The percentage of time in which thread header is ready on slice0 subslice2 thread dispatcher port 1"
+             data_type="float"
+             max_equation="100"
+             equation="C 4 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header02_ready_port1"
+             units="percent"
+             symbol_name="ThreadHeader02ReadyPort1"
+             availability="$SubsliceMask 0x4 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Thread Header Ready on Slice0 Subslice2 Port 0"
+             description="The percentage of time in which thread header is ready on slice0 subslice2 thread dispatcher port 0"
+             data_type="float"
+             max_equation="100"
+             equation="C 3 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header02_ready_port0"
+             units="percent"
+             symbol_name="ThreadHeader02ReadyPort0"
+             availability="$SubsliceMask 0x4 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="Thread Header Ready on Slice0 Subslice0 Port 0"
+             description="The percentage of time in which thread header is ready on slice0 subslice0 thread dispatcher port 0"
+             data_type="float"
+             max_equation="100"
+             equation="C 5 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header00_ready_port0"
+             units="percent"
+             symbol_name="ThreadHeader00ReadyPort0"
+             availability="$SubsliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <counter name="Thread Header Ready on Slice0 Subslice0 Port 1"
+             description="The percentage of time in which thread header is ready on slice0 subslice0 thread dispatcher port 1"
+             data_type="float"
+             max_equation="100"
+             equation="C 6 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header00_ready_port1"
+             units="percent"
+             symbol_name="ThreadHeader00ReadyPort1"
+             availability="$SubsliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x000091BC" value="0xE0500000" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x12124D60" />
+        <register type="NOA" address="0x00009888" value="0x12322E60" />
+        <register type="NOA" address="0x00009888" value="0x12524D60" />
+        <register type="NOA" address="0x00009888" value="0x022F3000" />
+        <register type="NOA" address="0x00009888" value="0x0A4C0014" />
+        <register type="NOA" address="0x00009888" value="0x000D8000" />
+        <register type="NOA" address="0x00009888" value="0x020DA000" />
+        <register type="NOA" address="0x00009888" value="0x040DA000" />
+        <register type="NOA" address="0x00009888" value="0x060D2000" />
+        <register type="NOA" address="0x00009888" value="0x0C0FE000" />
+        <register type="NOA" address="0x00009888" value="0x0E0F0097" />
+        <register type="NOA" address="0x00009888" value="0x082C8000" />
+        <register type="NOA" address="0x00009888" value="0x0A2C8000" />
+        <register type="NOA" address="0x00009888" value="0x002D8000" />
+        <register type="NOA" address="0x00009888" value="0x062D4000" />
+        <register type="NOA" address="0x00009888" value="0x0410C000" />
+        <register type="NOA" address="0x00009888" value="0x0411C000" />
+        <register type="NOA" address="0x00009888" value="0x04121FB7" />
+        <register type="NOA" address="0x00009888" value="0x00120000" />
+        <register type="NOA" address="0x00009888" value="0x04135000" />
+        <register type="NOA" address="0x00009888" value="0x00308000" />
+        <register type="NOA" address="0x00009888" value="0x06304000" />
+        <register type="NOA" address="0x00009888" value="0x00318000" />
+        <register type="NOA" address="0x00009888" value="0x06314000" />
+        <register type="NOA" address="0x00009888" value="0x00321B80" />
+        <register type="NOA" address="0x00009888" value="0x0632003F" />
+        <register type="NOA" address="0x00009888" value="0x00334000" />
+        <register type="NOA" address="0x00009888" value="0x06331000" />
+        <register type="NOA" address="0x00009888" value="0x0250C000" />
+        <register type="NOA" address="0x00009888" value="0x0251C000" />
+        <register type="NOA" address="0x00009888" value="0x02521FB7" />
+        <register type="NOA" address="0x00009888" value="0x00520000" />
+        <register type="NOA" address="0x00009888" value="0x02535000" />
+        <register type="NOA" address="0x00009888" value="0x1190FC00" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x41900800" />
+        <register type="NOA" address="0x00009888" value="0x43900063" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+        <register type="NOA" address="0x00009888" value="0x45900040" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002744" value="0x00800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x00800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E758" value="0x00015014" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+        <register type="FLEX" address="0x0000E65C" value="0x00055054" />
+    </register_config>
+  </set>
+
+  <set name="Compute Metrics Extra Gen9"
+       mdapi_supported_apis="VK OGL4 OCL IO BB"
+       underscore_name="compute_extra"
+       hw_config_guid="5f679fb0-909e-4c0e-b4b2-8e801f83e71b"
+       chipset="CFLGT2"
+       symbol_name="ComputeExtra"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="fpu1_active"
+             units="percent"
+             symbol_name="Fpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU1 Pipe Active including Ext Math"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing including Extended Math processing"
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ  C 7 READ C 6 READ FADD C 5 READ FADD 8 FMUL FADD 100 FMUL $EuCoresTotalCount FDIV $GpuCoreClocks FDIV"
+             underscore_name="fpu1_active_adjusted"
+             units="percent"
+             symbol_name="Fpu1ActiveAdjusted"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x121203E0" />
+        <register type="NOA" address="0x00009888" value="0x123203E0" />
+        <register type="NOA" address="0x00009888" value="0x125203E0" />
+        <register type="NOA" address="0x00009888" value="0x022F4000" />
+        <register type="NOA" address="0x00009888" value="0x0A4C0040" />
+        <register type="NOA" address="0x00009888" value="0x040DA000" />
+        <register type="NOA" address="0x00009888" value="0x060D2000" />
+        <register type="NOA" address="0x00009888" value="0x0E0F006C" />
+        <register type="NOA" address="0x00009888" value="0x0C2C8000" />
+        <register type="NOA" address="0x00009888" value="0x042D8000" />
+        <register type="NOA" address="0x00009888" value="0x06104000" />
+        <register type="NOA" address="0x00009888" value="0x06114000" />
+        <register type="NOA" address="0x00009888" value="0x06120033" />
+        <register type="NOA" address="0x00009888" value="0x00120000" />
+        <register type="NOA" address="0x00009888" value="0x06131000" />
+        <register type="NOA" address="0x00009888" value="0x04308000" />
+        <register type="NOA" address="0x00009888" value="0x04318000" />
+        <register type="NOA" address="0x00009888" value="0x04321980" />
+        <register type="NOA" address="0x00009888" value="0x00320000" />
+        <register type="NOA" address="0x00009888" value="0x04334000" />
+        <register type="NOA" address="0x00009888" value="0x04504000" />
+        <register type="NOA" address="0x00009888" value="0x04514000" />
+        <register type="NOA" address="0x00009888" value="0x04520033" />
+        <register type="NOA" address="0x00009888" value="0x00520000" />
+        <register type="NOA" address="0x00009888" value="0x04531000" />
+        <register type="NOA" address="0x00009888" value="0x1190E000" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+        <register type="NOA" address="0x00009888" value="0x43900C00" />
+        <register type="NOA" address="0x00009888" value="0x45900002" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002744" value="0x00800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x00800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00001000" />
+        <register type="FLEX" address="0x0000E558" value="0x00003002" />
+        <register type="FLEX" address="0x0000E658" value="0x00005004" />
+        <register type="FLEX" address="0x0000E758" value="0x00011010" />
+        <register type="FLEX" address="0x0000E45C" value="0x00050012" />
+        <register type="FLEX" address="0x0000E55C" value="0x00052051" />
+        <register type="FLEX" address="0x0000E65C" value="0x00000008" />
+    </register_config>
+  </set>
+
+  <set name="Media Vme Pipe Gen9"
+       mdapi_supported_apis="MEDIA IO BB"
+       underscore_name="vme_pipe"
+       hw_config_guid="0d09ba9a-1d1c-457d-83e2-74ac448014d6"
+       chipset="CFLGT2"
+       symbol_name="VMEPipe"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="EU Thread Occupancy"
+             description="The percentage of time in which hardware threads occupied EUs."
+             data_type="float"
+             max_equation="100"
+             equation="8 A 10 READ FMUL $EuThreadsCount FDIV $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_thread_occupancy"
+             units="percent"
+             symbol_name="EuThreadOccupancy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VME Busy"
+             description="The percentage of time in which VME (IME or CRE) was actively processing data."
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ B 3 READ FADD 2 FDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vme_busy"
+             units="percent"
+             symbol_name="VMEBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Overview System Batch Tier2"
+             mdapi_group="VME Pipe"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x141A5800" />
+        <register type="NOA" address="0x00009888" value="0x161A00C0" />
+        <register type="NOA" address="0x00009888" value="0x12180240" />
+        <register type="NOA" address="0x00009888" value="0x14180002" />
+        <register type="NOA" address="0x00009888" value="0x143A5800" />
+        <register type="NOA" address="0x00009888" value="0x163A00C0" />
+        <register type="NOA" address="0x00009888" value="0x12380240" />
+        <register type="NOA" address="0x00009888" value="0x14380002" />
+        <register type="NOA" address="0x00009888" value="0x002F1000" />
+        <register type="NOA" address="0x00009888" value="0x022F8000" />
+        <register type="NOA" address="0x00009888" value="0x042F3000" />
+        <register type="NOA" address="0x00009888" value="0x004C4000" />
+        <register type="NOA" address="0x00009888" value="0x0A4C1500" />
+        <register type="NOA" address="0x00009888" value="0x000D2000" />
+        <register type="NOA" address="0x00009888" value="0x060D8000" />
+        <register type="NOA" address="0x00009888" value="0x080DA000" />
+        <register type="NOA" address="0x00009888" value="0x0A0DA000" />
+        <register type="NOA" address="0x00009888" value="0x0C0DA000" />
+        <register type="NOA" address="0x00009888" value="0x0C0F0400" />
+        <register type="NOA" address="0x00009888" value="0x0E0F9500" />
+        <register type="NOA" address="0x00009888" value="0x100F002A" />
+        <register type="NOA" address="0x00009888" value="0x002C8000" />
+        <register type="NOA" address="0x00009888" value="0x0E2C8000" />
+        <register type="NOA" address="0x00009888" value="0x162C0A00" />
+        <register type="NOA" address="0x00009888" value="0x0A2DC000" />
+        <register type="NOA" address="0x00009888" value="0x0C2DC000" />
+        <register type="NOA" address="0x00009888" value="0x04193000" />
+        <register type="NOA" address="0x00009888" value="0x081A28C1" />
+        <register type="NOA" address="0x00009888" value="0x001A0000" />
+        <register type="NOA" address="0x00009888" value="0x00133000" />
+        <register type="NOA" address="0x00009888" value="0x0613C000" />
+        <register type="NOA" address="0x00009888" value="0x0813F000" />
+        <register type="NOA" address="0x00009888" value="0x00172000" />
+        <register type="NOA" address="0x00009888" value="0x06178000" />
+        <register type="NOA" address="0x00009888" value="0x0817A000" />
+        <register type="NOA" address="0x00009888" value="0x00180037" />
+        <register type="NOA" address="0x00009888" value="0x06180940" />
+        <register type="NOA" address="0x00009888" value="0x08180000" />
+        <register type="NOA" address="0x00009888" value="0x02180000" />
+        <register type="NOA" address="0x00009888" value="0x04183000" />
+        <register type="NOA" address="0x00009888" value="0x06393000" />
+        <register type="NOA" address="0x00009888" value="0x0C3A28C1" />
+        <register type="NOA" address="0x00009888" value="0x003A0000" />
+        <register type="NOA" address="0x00009888" value="0x0A33F000" />
+        <register type="NOA" address="0x00009888" value="0x0C33F000" />
+        <register type="NOA" address="0x00009888" value="0x0A37A000" />
+        <register type="NOA" address="0x00009888" value="0x0C37A000" />
+        <register type="NOA" address="0x00009888" value="0x0A380977" />
+        <register type="NOA" address="0x00009888" value="0x08380000" />
+        <register type="NOA" address="0x00009888" value="0x04380000" />
+        <register type="NOA" address="0x00009888" value="0x06383000" />
+        <register type="NOA" address="0x00009888" value="0x119000FF" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x41900040" />
+        <register type="NOA" address="0x00009888" value="0x55900000" />
+        <register type="NOA" address="0x00009888" value="0x45900800" />
+        <register type="NOA" address="0x00009888" value="0x47901000" />
+        <register type="NOA" address="0x00009888" value="0x57900000" />
+        <register type="NOA" address="0x00009888" value="0x49900844" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x30800000" />
+        <register type="OA" address="0x00002770" value="0x00100030" />
+        <register type="OA" address="0x00002774" value="0x0000FFF9" />
+        <register type="OA" address="0x00002778" value="0x00000002" />
+        <register type="OA" address="0x0000277C" value="0x0000FFFC" />
+        <register type="OA" address="0x00002780" value="0x00000002" />
+        <register type="OA" address="0x00002784" value="0x0000FFF3" />
+        <register type="OA" address="0x00002788" value="0x00100180" />
+        <register type="OA" address="0x0000278C" value="0x0000FFCF" />
+        <register type="OA" address="0x00002790" value="0x00000002" />
+        <register type="OA" address="0x00002794" value="0x0000FFCF" />
+        <register type="OA" address="0x00002798" value="0x00000002" />
+        <register type="OA" address="0x0000279C" value="0x0000FF3F" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00008003" />
+    </register_config>
+  </set>
+
+  <set name="Gpu Rings Busyness"
+       mdapi_supported_apis="VK OGL OCL MEDIA IO BB"
+       underscore_name="gpu_busyness"
+       hw_config_guid="e2f162ae-5732-4af0-8b11-69510f57094a"
+       chipset="CFLGT2"
+       symbol_name="GpuBusyness"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="Vebox Ring Busy"
+             description="The percentage of time when vebox command streamer was busy."
+             data_type="float"
+             max_equation="100"
+             equation="C 5 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vebox_busy"
+             units="percent"
+             symbol_name="VeboxBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="System Frame Batch"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Render Ring Busy"
+             description="The percentage of time when render command streamer was busy."
+             data_type="float"
+             max_equation="100"
+             equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="render_busy"
+             units="percent"
+             symbol_name="RenderBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="System Frame Batch"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Vdbox0 Ring Busy"
+             description="The percentage of time when Vdbox0 command streamer was busy."
+             data_type="float"
+             max_equation="100"
+             equation="C 6 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vdbox0_busy"
+             units="percent"
+             symbol_name="Vdbox0Busy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="System Frame Batch"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Blitter Ring Busy"
+             description="The percentage of time when blitter command streamer was busy."
+             data_type="float"
+             max_equation="100"
+             equation="C 4 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="blitter_busy"
+             units="percent"
+             symbol_name="BlitterBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="System Frame Batch"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="AnyRingBusy"
+             description="The percentage of time when any command streamer was busy."
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="any_ring_busy"
+             units="percent"
+             symbol_name="AnyRingBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x13805800" />
+        <register type="NOA" address="0x00009888" value="0x05962C00" />
+        <register type="NOA" address="0x00009888" value="0x19950016" />
+        <register type="NOA" address="0x00009888" value="0x19C05800" />
+        <register type="NOA" address="0x00009888" value="0x07800035" />
+        <register type="NOA" address="0x00009888" value="0x11800000" />
+        <register type="NOA" address="0x00009888" value="0x1D810400" />
+        <register type="NOA" address="0x00009888" value="0x07960025" />
+        <register type="NOA" address="0x00009888" value="0x21960000" />
+        <register type="NOA" address="0x00009888" value="0x0B964000" />
+        <register type="NOA" address="0x00009888" value="0x1B930062" />
+        <register type="NOA" address="0x00009888" value="0x17948000" />
+        <register type="NOA" address="0x00009888" value="0x1B940008" />
+        <register type="NOA" address="0x00009888" value="0x05950075" />
+        <register type="NOA" address="0x00009888" value="0x1D950000" />
+        <register type="NOA" address="0x00009888" value="0x07E54000" />
+        <register type="NOA" address="0x00009888" value="0x09924000" />
+        <register type="NOA" address="0x00009888" value="0x05982000" />
+        <register type="NOA" address="0x00009888" value="0x19908000" />
+        <register type="NOA" address="0x00009888" value="0x1B904000" />
+        <register type="NOA" address="0x00009888" value="0x1D908000" />
+        <register type="NOA" address="0x00009888" value="0x1F908000" />
+        <register type="NOA" address="0x00009888" value="0x09978000" />
+        <register type="NOA" address="0x00009888" value="0x05C08500" />
+        <register type="NOA" address="0x00009888" value="0x25C00000" />
+        <register type="NOA" address="0x00009888" value="0x1BC00000" />
+        <register type="NOA" address="0x00009888" value="0x0BC54000" />
+        <register type="NOA" address="0x00009888" value="0x11900000" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+        <register type="NOA" address="0x00009888" value="0x43900C60" />
+        <register type="NOA" address="0x00009888" value="0x45900040" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x10800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+        <register type="OA" address="0x00002770" value="0x00078000" />
+        <register type="OA" address="0x00002774" value="0x00000FFF" />
+    </register_config>
+  </set>
+
+  <set name="MDAPI testing set Gen9.5"
+       mdapi_supported_apis="VK OGL OCL IO BB"
+       underscore_name="test_oa"
+       hw_config_guid="74fb4902-d3d3-4237-9e90-cbdc68d0a446"
+       chipset="CFLGT2"
+       symbol_name="TestOa"
+       >
+    <counter name="TestCounter7"
+             description="HW test counter 7. Factor: 0.666"
+             data_type="uint64"
+             equation="B 7 READ"
+             underscore_name="counter7"
+             units="events"
+             symbol_name="Counter7"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="TestCounter8"
+             description="HW test counter 8. Should be equal to 1."
+             data_type="uint64"
+             equation="C 7 READ"
+             underscore_name="counter8"
+             units="events"
+             symbol_name="Counter8"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="TestCounter4"
+             description="HW test counter 4. Factor: 0.333"
+             data_type="uint64"
+             equation="B 4 READ"
+             underscore_name="counter4"
+             units="events"
+             symbol_name="Counter4"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="TestCounter5"
+             description="HW test counter 5. Factor: 0.333"
+             data_type="uint64"
+             equation="B 5 READ"
+             underscore_name="counter5"
+             units="events"
+             symbol_name="Counter5"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="TestCounter6"
+             description="HW test counter 6. Factor: 0.166"
+             data_type="uint64"
+             equation="B 6 READ"
+             underscore_name="counter6"
+             units="events"
+             symbol_name="Counter6"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="TestCounter3"
+             description="HW test counter 3. Factor: 0.5"
+             data_type="uint64"
+             equation="B 3 READ"
+             underscore_name="counter3"
+             units="events"
+             symbol_name="Counter3"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="TestCounter0"
+             description="HW test counter 0. Factor: 0.0"
+             data_type="uint64"
+             equation="B 0 READ"
+             underscore_name="counter0"
+             units="events"
+             symbol_name="Counter0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="TestCounter1"
+             description="HW test counter 1. Factor: 1.0"
+             data_type="uint64"
+             equation="B 1 READ"
+             underscore_name="counter1"
+             units="events"
+             symbol_name="Counter1"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="TestCounter2"
+             description="HW test counter 2. Factor: 1.0"
+             data_type="uint64"
+             equation="B 2 READ"
+             underscore_name="counter2"
+             units="events"
+             symbol_name="Counter2"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x11810000" />
+        <register type="NOA" address="0x00009888" value="0x07810013" />
+        <register type="NOA" address="0x00009888" value="0x1F810000" />
+        <register type="NOA" address="0x00009888" value="0x1D810000" />
+        <register type="NOA" address="0x00009888" value="0x1B930040" />
+        <register type="NOA" address="0x00009888" value="0x07E54000" />
+        <register type="NOA" address="0x00009888" value="0x1F908000" />
+        <register type="NOA" address="0x00009888" value="0x11900000" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+        <register type="NOA" address="0x00009888" value="0x45900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002744" value="0x00800000" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002770" value="0x00000004" />
+        <register type="OA" address="0x00002774" value="0x00000000" />
+        <register type="OA" address="0x00002778" value="0x00000003" />
+        <register type="OA" address="0x0000277C" value="0x00000000" />
+        <register type="OA" address="0x00002780" value="0x00000007" />
+        <register type="OA" address="0x00002784" value="0x00000000" />
+        <register type="OA" address="0x00002788" value="0x00100002" />
+        <register type="OA" address="0x0000278C" value="0x0000FFF7" />
+        <register type="OA" address="0x00002790" value="0x00100002" />
+        <register type="OA" address="0x00002794" value="0x0000FFCF" />
+        <register type="OA" address="0x00002798" value="0x00100082" />
+        <register type="OA" address="0x0000279C" value="0x0000FFEF" />
+        <register type="OA" address="0x000027A0" value="0x001000C2" />
+        <register type="OA" address="0x000027A4" value="0x0000FFE7" />
+        <register type="OA" address="0x000027A8" value="0x00100001" />
+        <register type="OA" address="0x000027AC" value="0x0000FFE7" />
+    </register_config>
+  </set>
+
+  <set name="Metric set PMA Stall"
+       mdapi_supported_apis="VK OGL OGL4 OCL IO MEDIA"
+       underscore_name="pma__stall"
+       hw_config_guid="5ccbf9fb-6bf2-456b-a749-bdff7b1aff13"
+       chipset="CFLGT2"
+       symbol_name="PMA_Stall"
+       >
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="STC PMA stall"
+             description="Percentage of time when stencil cache line and an overlapping pixel are causing stalls"
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ B 1 READ FADD 2 FDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="stc_pma_stall"
+             units="percent"
+             symbol_name="StcPMAStall"
+             availability="$SliceMask 1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_group="GPU/Stencil Cache"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x122D3080" />
+        <register type="NOA" address="0x00009888" value="0x000D2000" />
+        <register type="NOA" address="0x00009888" value="0x060D8000" />
+        <register type="NOA" address="0x00009888" value="0x080DA000" />
+        <register type="NOA" address="0x00009888" value="0x0A0DA000" />
+        <register type="NOA" address="0x00009888" value="0x0C0F0800" />
+        <register type="NOA" address="0x00009888" value="0x0E0FAA00" />
+        <register type="NOA" address="0x00009888" value="0x100F0002" />
+        <register type="NOA" address="0x00009888" value="0x002D0025" />
+        <register type="NOA" address="0x00009888" value="0x062D1300" />
+        <register type="NOA" address="0x00009888" value="0x082D16A4" />
+        <register type="NOA" address="0x00009888" value="0x0A2D162E" />
+        <register type="NOA" address="0x00009888" value="0x102D0000" />
+        <register type="NOA" address="0x00009888" value="0x1190003F" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x41900000" />
+        <register type="NOA" address="0x00009888" value="0x55900000" />
+        <register type="NOA" address="0x00009888" value="0x45900000" />
+        <register type="NOA" address="0x00009888" value="0x47900000" />
+        <register type="NOA" address="0x00009888" value="0x57900000" />
+        <register type="NOA" address="0x00009888" value="0x49900000" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x30800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+        <register type="OA" address="0x00002770" value="0x00E00021" />
+        <register type="OA" address="0x00002774" value="0x0007FFF8" />
+        <register type="OA" address="0x00002778" value="0x07000101" />
+        <register type="OA" address="0x0000277C" value="0x0038FFC7" />
+    </register_config>
+  </set>
+
+</metrics>
diff --git a/lib/i915/perf-configs/oa-cflgt3.xml b/lib/i915/perf-configs/oa-cflgt3.xml
new file mode 100644
index 00000000..497f9990
--- /dev/null
+++ b/lib/i915/perf-configs/oa-cflgt3.xml
@@ -0,0 +1,10933 @@
+<?xml version="1.0"?>
+<metrics version="1581935520" merge_md5="">
+  <set name="Render Metrics Basic Gen9"
+       mdapi_supported_apis="VK OGL OCL IO BB"
+       underscore_name="render_basic"
+       hw_config_guid="b316bcab-212f-4228-97de-af6b5a1a2ea1"
+       chipset="CFLGT3"
+       symbol_name="RenderBasic"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Misses"
+             description="The total number of L3 misses."
+             data_type="uint64"
+             equation="C 4 READ"
+             underscore_name="l3_misses"
+             units="messages"
+             symbol_name="L3Misses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/TAG"
+             />
+    <counter name="GTI L3 Throughput"
+             description="The total number of GPU memory bytes transferred between L3 caches and GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="$L3Misses 64 UMUL"
+             underscore_name="gti_l3_throughput"
+             units="bytes"
+             symbol_name="GtiL3Throughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Cache Misses"
+             description="The total number of sampler cache misses in all LODs in all sampler units."
+             data_type="uint64"
+             equation="B 4 READ B 5 READ UADD 8 UMUL"
+             underscore_name="sampler_l1_misses"
+             units="messages"
+             symbol_name="SamplerL1Misses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler 1 Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which Sampler 1 has been slowing down the pipe when processing EU requests."
+             data_type="float"
+             high_watermark="15"
+             equation="B 3 READ 100 UMUL $GpuCoreClocks FDIV"
+             max_equation="100"
+             underscore_name="sampler1_bottleneck"
+             units="percent"
+             symbol_name="Sampler1Bottleneck"
+             availability="$SubsliceMask 0x12 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="L3 Sampler Throughput"
+             description="The total number of GPU memory bytes transferred between samplers and L3 caches."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="$SamplerL1Misses 64 UMUL"
+             underscore_name="l3_sampler_throughput"
+             units="bytes"
+             symbol_name="L3SamplerThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Sampler"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were actively processed on both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Sampler 0 Busy"
+             description="The percentage of time in which Sampler 0 has been processing EU requests."
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler0_busy"
+             units="percent"
+             symbol_name="Sampler0Busy"
+             availability="$SubsliceMask 0x09 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_group="Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Sampler 1 Busy"
+             description="The percentage of time in which Sampler 1 has been processing EU requests."
+             data_type="float"
+             max_equation="100"
+             equation="B 1 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler1_busy"
+             units="percent"
+             symbol_name="Sampler1Busy"
+             availability="$SubsliceMask 0x12 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_group="Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Samplers Busy"
+             description="The percentage of time in which samplers have been processing EU requests."
+             data_type="float"
+             max_equation="100"
+             equation="$Sampler0Busy $Sampler1Busy FMAX"
+             underscore_name="samplers_busy"
+             units="percent"
+             symbol_name="SamplersBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="Sampler"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="GTI Fixed Pipe Throughput"
+             description="The total number of GPU memory bytes transferred between 3D Pipeline (Command Dispatch, Input Assembly and Stream Output) and GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL"
+             equation="B 6 READ B 7 READ UADD 64 UMUL"
+             underscore_name="gti_vf_throughput"
+             units="bytes"
+             symbol_name="GtiVfThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="GTI/3D Pipe"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler 0 Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which Sampler 0 has been slowing down the pipe when processing EU requests."
+             data_type="float"
+             high_watermark="15"
+             equation="B 2 READ 100 UMUL $GpuCoreClocks FDIV"
+             max_equation="100"
+             underscore_name="sampler0_bottleneck"
+             units="percent"
+             symbol_name="Sampler0Bottleneck"
+             availability="$SubsliceMask 0x09 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texel lookups (with 2x2 accuracy) that missed the L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="L3 Lookup Accesses w/o IC"
+             description="The total number of L3 cache lookup accesses w/o IC."
+             data_type="uint64"
+             equation="$SamplerL1Misses $ShaderMemoryAccesses UADD"
+             underscore_name="l3_lookups"
+             units="messages"
+             symbol_name="L3Lookups"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/TAG"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GTI Read Throughput"
+             description="The total number of GPU memory bytes read from GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL"
+             equation="C 6 READ 64 UMUL"
+             underscore_name="gti_read_throughput"
+             units="bytes"
+             symbol_name="GtiReadThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GTI Depth Throughput"
+             description="The total number of GPU memory bytes transferred between depth caches and GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="C 0 READ C 1 READ UADD 64 UMUL"
+             underscore_name="gti_depth_throughput"
+             units="bytes"
+             symbol_name="GtiDepthThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="GTI/Depth Cache"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Samplers Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which samplers have been slowing down the pipe when processing EU requests."
+             data_type="float"
+             high_watermark="15"
+             equation="$Sampler0Bottleneck $Sampler1Bottleneck FMAX"
+             max_equation="100"
+             underscore_name="sampler_bottleneck"
+             units="percent"
+             symbol_name="SamplerBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Indicate System Frame Batch Draw"
+             mdapi_group="Sampler"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="GTI HDC TLB Lookup Throughput"
+             description="The total number of GPU memory bytes transferred between GTI and HDC, when HDC is doing TLB lookups."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="C 5 READ 64 UMUL"
+             underscore_name="gti_hdc_lookups_throughput"
+             units="bytes"
+             symbol_name="GtiHdcLookupsThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GTI RCC Throughput"
+             description="The total number of GPU memory bytes transferred between render color caches and GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="C 2 READ C 3 READ UADD 64 UMUL"
+             underscore_name="gti_rcc_throughput"
+             units="bytes"
+             symbol_name="GtiRccThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="GTI/Color Cache"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="GTI Write Throughput"
+             description="The total number of GPU memory bytes written to GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 32 UMUL"
+             equation="C 7 READ 64 UMUL"
+             underscore_name="gti_write_throughput"
+             units="bytes"
+             symbol_name="GtiWriteThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x166C01E0" />
+        <register type="NOA" address="0x00009888" value="0x12170280" />
+        <register type="NOA" address="0x00009888" value="0x12370280" />
+        <register type="NOA" address="0x00009888" value="0x16EC01E0" />
+        <register type="NOA" address="0x00009888" value="0x11930317" />
+        <register type="NOA" address="0x00009888" value="0x159303DF" />
+        <register type="NOA" address="0x00009888" value="0x3F900003" />
+        <register type="NOA" address="0x00009888" value="0x1A4E0380" />
+        <register type="NOA" address="0x00009888" value="0x0A6C0053" />
+        <register type="NOA" address="0x00009888" value="0x106C0000" />
+        <register type="NOA" address="0x00009888" value="0x1C6C0000" />
+        <register type="NOA" address="0x00009888" value="0x0A1B4000" />
+        <register type="NOA" address="0x00009888" value="0x1C1C0001" />
+        <register type="NOA" address="0x00009888" value="0x002F1000" />
+        <register type="NOA" address="0x00009888" value="0x042F1000" />
+        <register type="NOA" address="0x00009888" value="0x004C4000" />
+        <register type="NOA" address="0x00009888" value="0x0A4C8400" />
+        <register type="NOA" address="0x00009888" value="0x0C4C0002" />
+        <register type="NOA" address="0x00009888" value="0x000D2000" />
+        <register type="NOA" address="0x00009888" value="0x060D8000" />
+        <register type="NOA" address="0x00009888" value="0x080DA000" />
+        <register type="NOA" address="0x00009888" value="0x0A0DA000" />
+        <register type="NOA" address="0x00009888" value="0x0C0F0400" />
+        <register type="NOA" address="0x00009888" value="0x0E0F6600" />
+        <register type="NOA" address="0x00009888" value="0x100F0001" />
+        <register type="NOA" address="0x00009888" value="0x002C8000" />
+        <register type="NOA" address="0x00009888" value="0x162CA200" />
+        <register type="NOA" address="0x00009888" value="0x062D8000" />
+        <register type="NOA" address="0x00009888" value="0x082D8000" />
+        <register type="NOA" address="0x00009888" value="0x00133000" />
+        <register type="NOA" address="0x00009888" value="0x08133000" />
+        <register type="NOA" address="0x00009888" value="0x00170020" />
+        <register type="NOA" address="0x00009888" value="0x08170021" />
+        <register type="NOA" address="0x00009888" value="0x10170000" />
+        <register type="NOA" address="0x00009888" value="0x0633C000" />
+        <register type="NOA" address="0x00009888" value="0x0833C000" />
+        <register type="NOA" address="0x00009888" value="0x06370800" />
+        <register type="NOA" address="0x00009888" value="0x08370840" />
+        <register type="NOA" address="0x00009888" value="0x10370000" />
+        <register type="NOA" address="0x00009888" value="0x1ACE0200" />
+        <register type="NOA" address="0x00009888" value="0x0AEC5300" />
+        <register type="NOA" address="0x00009888" value="0x10EC0000" />
+        <register type="NOA" address="0x00009888" value="0x1CEC0000" />
+        <register type="NOA" address="0x00009888" value="0x0A9B8000" />
+        <register type="NOA" address="0x00009888" value="0x1C9C0002" />
+        <register type="NOA" address="0x00009888" value="0x0CCC0002" />
+        <register type="NOA" address="0x00009888" value="0x0A8D8000" />
+        <register type="NOA" address="0x00009888" value="0x108F0001" />
+        <register type="NOA" address="0x00009888" value="0x16AC8000" />
+        <register type="NOA" address="0x00009888" value="0x0D933031" />
+        <register type="NOA" address="0x00009888" value="0x0F933E3F" />
+        <register type="NOA" address="0x00009888" value="0x01933D00" />
+        <register type="NOA" address="0x00009888" value="0x0393073C" />
+        <register type="NOA" address="0x00009888" value="0x0593000E" />
+        <register type="NOA" address="0x00009888" value="0x1D930000" />
+        <register type="NOA" address="0x00009888" value="0x19930000" />
+        <register type="NOA" address="0x00009888" value="0x1B930000" />
+        <register type="NOA" address="0x00009888" value="0x1D900157" />
+        <register type="NOA" address="0x00009888" value="0x1F900158" />
+        <register type="NOA" address="0x00009888" value="0x35900000" />
+        <register type="NOA" address="0x00009888" value="0x2B908000" />
+        <register type="NOA" address="0x00009888" value="0x2D908000" />
+        <register type="NOA" address="0x00009888" value="0x2F908000" />
+        <register type="NOA" address="0x00009888" value="0x31908000" />
+        <register type="NOA" address="0x00009888" value="0x15908000" />
+        <register type="NOA" address="0x00009888" value="0x17908000" />
+        <register type="NOA" address="0x00009888" value="0x19908000" />
+        <register type="NOA" address="0x00009888" value="0x1B908000" />
+        <register type="NOA" address="0x00009888" value="0x1190003F" />
+        <register type="NOA" address="0x00009888" value="0x51902240" />
+        <register type="NOA" address="0x00009888" value="0x41900C00" />
+        <register type="NOA" address="0x00009888" value="0x55900242" />
+        <register type="NOA" address="0x00009888" value="0x45900084" />
+        <register type="NOA" address="0x00009888" value="0x47901400" />
+        <register type="NOA" address="0x00009888" value="0x57902220" />
+        <register type="NOA" address="0x00009888" value="0x49900C60" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+        <register type="NOA" address="0x00009888" value="0x4B900063" />
+        <register type="NOA" address="0x00009888" value="0x59900002" />
+        <register type="NOA" address="0x00009888" value="0x43900C63" />
+        <register type="NOA" address="0x00009888" value="0x53902222" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x00800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+        <register type="OA" address="0x00002740" value="0x00000000" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E758" value="0x00015014" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+        <register type="FLEX" address="0x0000E65C" value="0x00222222" />
+    </register_config>
+  </set>
+
+  <set name="Compute Metrics Basic Gen9"
+       mdapi_supported_apis="VK OGL4 OCL IO BB"
+       underscore_name="compute_basic"
+       hw_config_guid="d2eec5b1-4dd8-4170-ae83-9531abd0692f"
+       chipset="CFLGT3"
+       symbol_name="ComputeBasic"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Untyped Bytes Read"
+             description="The total number of untyped memory bytes read via Data Port."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="B 6 READ B 7 READ C 0 READ UADD UADD $EuSlicesTotalCount 64 UMUL UMUL"
+             underscore_name="untyped_bytes_read"
+             units="bytes"
+             symbol_name="UntypedBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Typed Bytes Written"
+             description="The total number of typed memory bytes written via Data Port."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="B 3 READ B 4 READ B 5 READ UADD UADD $EuSlicesTotalCount 64 UMUL UMUL"
+             underscore_name="typed_bytes_written"
+             units="bytes"
+             symbol_name="TypedBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="fpu0_active"
+             units="percent"
+             symbol_name="Fpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="fpu1_active"
+             units="percent"
+             symbol_name="Fpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO OCL BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU AVG IPC Rate"
+             description="The average rate of IPC calculated for 2 FPU pipelines."
+             data_type="float"
+             max_equation="2"
+             equation="A 9 READ  A 10 READ  A 11 READ UADD  A 9 READ USUB FDIV 1 FADD"
+             underscore_name="eu_avg_ipc_rate"
+             units="number"
+             symbol_name="EuAvgIpcRate"
+             semantic_type="ratio"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier4 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO OCL BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO OCL BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texel lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GTI Read Throughput"
+             description="The total number of GPU memory bytes read from GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="C 4 READ 64 UMUL"
+             underscore_name="gti_read_throughput"
+             units="bytes"
+             symbol_name="GtiReadThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Untyped Writes"
+             description="The total number of untyped memory bytes written via Data Port."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="C 1 READ C 2 READ C 3 READ UADD UADD $EuSlicesTotalCount 64 UMUL UMUL"
+             underscore_name="untyped_bytes_written"
+             units="bytes"
+             symbol_name="UntypedBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO OCL BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="Typed Bytes Read"
+             description="The total number of typed memory bytes read via Data Port."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="B 0 READ B 1 READ B 2 READ UADD UADD $EuSlicesTotalCount 64 UMUL UMUL"
+             underscore_name="typed_bytes_read"
+             units="bytes"
+             symbol_name="TypedBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="EU Thread Occupancy"
+             description="The percentage of time in which hardware threads occupied EUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 13 READ 8 UMUL $EuCoresTotalCount UDIV $EuThreadsCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_thread_occupancy"
+             units="percent"
+             symbol_name="EuThreadOccupancy"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO OCL BB"
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO OCL BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO OCL BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="GTI Write Throughput"
+             description="The total number of GPU memory bytes written to GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 32 UMUL"
+             equation="C 5 READ 64 UMUL"
+             underscore_name="gti_write_throughput"
+             units="bytes"
+             symbol_name="GtiWriteThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO OCL BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO OCL BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <counter name="EU Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_send_active"
+             units="percent"
+             symbol_name="EuSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO OCL BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x104F00E0" />
+        <register type="NOA" address="0x00009888" value="0x124F1C00" />
+        <register type="NOA" address="0x00009888" value="0x106C00E0" />
+        <register type="NOA" address="0x00009888" value="0x37906800" />
+        <register type="NOA" address="0x00009888" value="0x3F900003" />
+        <register type="NOA" address="0x00009888" value="0x004E8000" />
+        <register type="NOA" address="0x00009888" value="0x1A4E0820" />
+        <register type="NOA" address="0x00009888" value="0x1C4E0002" />
+        <register type="NOA" address="0x00009888" value="0x064F0900" />
+        <register type="NOA" address="0x00009888" value="0x084F0032" />
+        <register type="NOA" address="0x00009888" value="0x0A4F1891" />
+        <register type="NOA" address="0x00009888" value="0x0C4F0E00" />
+        <register type="NOA" address="0x00009888" value="0x0E4F003C" />
+        <register type="NOA" address="0x00009888" value="0x004F0D80" />
+        <register type="NOA" address="0x00009888" value="0x024F003B" />
+        <register type="NOA" address="0x00009888" value="0x006C0002" />
+        <register type="NOA" address="0x00009888" value="0x086C0100" />
+        <register type="NOA" address="0x00009888" value="0x0C6C000C" />
+        <register type="NOA" address="0x00009888" value="0x0E6C0B00" />
+        <register type="NOA" address="0x00009888" value="0x186C0000" />
+        <register type="NOA" address="0x00009888" value="0x1C6C0000" />
+        <register type="NOA" address="0x00009888" value="0x1E6C0000" />
+        <register type="NOA" address="0x00009888" value="0x001B4000" />
+        <register type="NOA" address="0x00009888" value="0x081B8000" />
+        <register type="NOA" address="0x00009888" value="0x0C1B4000" />
+        <register type="NOA" address="0x00009888" value="0x0E1B8000" />
+        <register type="NOA" address="0x00009888" value="0x101C8000" />
+        <register type="NOA" address="0x00009888" value="0x1A1C8000" />
+        <register type="NOA" address="0x00009888" value="0x1C1C0024" />
+        <register type="NOA" address="0x00009888" value="0x065B8000" />
+        <register type="NOA" address="0x00009888" value="0x085B4000" />
+        <register type="NOA" address="0x00009888" value="0x0A5BC000" />
+        <register type="NOA" address="0x00009888" value="0x0C5B8000" />
+        <register type="NOA" address="0x00009888" value="0x0E5B4000" />
+        <register type="NOA" address="0x00009888" value="0x005B8000" />
+        <register type="NOA" address="0x00009888" value="0x025B4000" />
+        <register type="NOA" address="0x00009888" value="0x1A5C6000" />
+        <register type="NOA" address="0x00009888" value="0x1C5C001B" />
+        <register type="NOA" address="0x00009888" value="0x125C8000" />
+        <register type="NOA" address="0x00009888" value="0x145C8000" />
+        <register type="NOA" address="0x00009888" value="0x004C8000" />
+        <register type="NOA" address="0x00009888" value="0x0A4C2000" />
+        <register type="NOA" address="0x00009888" value="0x0C4C0208" />
+        <register type="NOA" address="0x00009888" value="0x000DA000" />
+        <register type="NOA" address="0x00009888" value="0x060D8000" />
+        <register type="NOA" address="0x00009888" value="0x080DA000" />
+        <register type="NOA" address="0x00009888" value="0x0A0DA000" />
+        <register type="NOA" address="0x00009888" value="0x0C0DA000" />
+        <register type="NOA" address="0x00009888" value="0x0E0DA000" />
+        <register type="NOA" address="0x00009888" value="0x020D2000" />
+        <register type="NOA" address="0x00009888" value="0x0C0F5400" />
+        <register type="NOA" address="0x00009888" value="0x0E0F5500" />
+        <register type="NOA" address="0x00009888" value="0x100F0155" />
+        <register type="NOA" address="0x00009888" value="0x002C8000" />
+        <register type="NOA" address="0x00009888" value="0x0E2CC000" />
+        <register type="NOA" address="0x00009888" value="0x162CFB00" />
+        <register type="NOA" address="0x00009888" value="0x182C00BE" />
+        <register type="NOA" address="0x00009888" value="0x022CC000" />
+        <register type="NOA" address="0x00009888" value="0x042CC000" />
+        <register type="NOA" address="0x00009888" value="0x19900157" />
+        <register type="NOA" address="0x00009888" value="0x1B900158" />
+        <register type="NOA" address="0x00009888" value="0x1D900105" />
+        <register type="NOA" address="0x00009888" value="0x1F900103" />
+        <register type="NOA" address="0x00009888" value="0x35900000" />
+        <register type="NOA" address="0x00009888" value="0x11900FFF" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x41900800" />
+        <register type="NOA" address="0x00009888" value="0x55900000" />
+        <register type="NOA" address="0x00009888" value="0x45900821" />
+        <register type="NOA" address="0x00009888" value="0x47900802" />
+        <register type="NOA" address="0x00009888" value="0x57900000" />
+        <register type="NOA" address="0x00009888" value="0x49900802" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+        <register type="NOA" address="0x00009888" value="0x4B900002" />
+        <register type="NOA" address="0x00009888" value="0x59900000" />
+        <register type="NOA" address="0x00009888" value="0x43900422" />
+        <register type="NOA" address="0x00009888" value="0x53904444" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x00800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+        <register type="OA" address="0x00002740" value="0x00000000" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00000003" />
+        <register type="FLEX" address="0x0000E658" value="0x00002001" />
+        <register type="FLEX" address="0x0000E758" value="0x00778008" />
+        <register type="FLEX" address="0x0000E45C" value="0x00088078" />
+        <register type="FLEX" address="0x0000E55C" value="0x00808708" />
+        <register type="FLEX" address="0x0000E65C" value="0x00222222" />
+    </register_config>
+  </set>
+
+  <set name="Render Metrics for 3D Pipeline Profile Gen9"
+       mdapi_supported_apis="VK OGL OCL IO BB"
+       underscore_name="render_pipe_profile"
+       hw_config_guid="9875e050-b1bc-45e6-a6ab-665594601df9"
+       chipset="CFLGT3"
+       symbol_name="RenderPipeProfile"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Bottleneck"
+             low_watermark="10"
+             description="The percentage of time in which vertex shader pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="30"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_bottleneck"
+             units="percent"
+             symbol_name="VsBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Hi-Depth Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which early hierarchical depth test pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="15"
+             equation="C 6 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="hi_depth_bottleneck"
+             units="percent"
+             symbol_name="HiDepthBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which geometry shader pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="15"
+             equation="B 3 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gs_bottleneck"
+             units="percent"
+             symbol_name="GsBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Geometry Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="BC Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which barycentric coordinates calculation pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="15"
+             equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="bc_bottleneck"
+             units="percent"
+             symbol_name="BcBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Rasterizer/Barycentric Calc"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="HS Stall"
+             description="The percentage of time in which hull shader pipeline stage was stalled."
+             data_type="float"
+             equation="C 1 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="hs_stall"
+             units="percent"
+             symbol_name="HsStall"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier4 Correlate Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Hull Shader"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texel lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="VF Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which vertex fetch pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="15"
+             equation="C 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vf_bottleneck"
+             units="percent"
+             symbol_name="VfBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Input Assembler"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Strip-Fans Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which strip-fans pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="10"
+             equation="B 6 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sf_bottleneck"
+             units="percent"
+             symbol_name="SfBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Rasterizer/Strip-Fans"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SF Stall"
+             description="The percentage of time in which strip-fans pipeline stage was stalled."
+             data_type="float"
+             equation="C 5 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sf_stall"
+             units="percent"
+             symbol_name="SfStall"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Correlate Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Strip-Fans"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="HS Bottleneck"
+             low_watermark="3"
+             description="The percentage of time in which hull shader pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="9"
+             equation="B 1 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="hs_bottleneck"
+             units="percent"
+             symbol_name="HsBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Hull Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="CL Stall"
+             description="The percentage of time in which clipper pipeline stage was stalled."
+             data_type="float"
+             equation="C 4 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="cl_stall"
+             units="percent"
+             symbol_name="ClStall"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Correlate Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Clipper"
+             />
+    <counter name="SO Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which stream output pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="15"
+             equation="B 4 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="so_bottleneck"
+             units="percent"
+             symbol_name="SoBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Stream Output"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="DS Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which domain shader pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="15"
+             equation="B 2 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ds_bottleneck"
+             units="percent"
+             symbol_name="DsBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Domain Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Clipper Bottleneck"
+             low_watermark="10"
+             description="The percentage of time in which clipper pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="30"
+             equation="B 5 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="cl_bottleneck"
+             units="percent"
+             symbol_name="ClBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Clipper"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Stall"
+             description="The percentage of time in which domain shader pipeline stage was stalled."
+             data_type="float"
+             equation="C 2 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ds_stall"
+             units="percent"
+             symbol_name="DsStall"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier4 Correlate Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Domain Shader"
+             />
+    <counter name="Early Depth Bottleneck"
+             low_watermark="10"
+             description="The percentage of time in which early depth test pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="30"
+             equation="B 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="early_depth_bottleneck"
+             units="percent"
+             symbol_name="EarlyDepthBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="SO Stall"
+             description="The percentage of time in which stream-output pipeline stage was stalled."
+             data_type="float"
+             equation="C 3 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="so_stall"
+             units="percent"
+             symbol_name="SoStall"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Correlate Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Stream Output"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x0C0E001F" />
+        <register type="NOA" address="0x00009888" value="0x0A0F0000" />
+        <register type="NOA" address="0x00009888" value="0x10116800" />
+        <register type="NOA" address="0x00009888" value="0x178A03E0" />
+        <register type="NOA" address="0x00009888" value="0x11824C00" />
+        <register type="NOA" address="0x00009888" value="0x11830020" />
+        <register type="NOA" address="0x00009888" value="0x13840020" />
+        <register type="NOA" address="0x00009888" value="0x11850019" />
+        <register type="NOA" address="0x00009888" value="0x11860007" />
+        <register type="NOA" address="0x00009888" value="0x01870C40" />
+        <register type="NOA" address="0x00009888" value="0x17880000" />
+        <register type="NOA" address="0x00009888" value="0x022F4000" />
+        <register type="NOA" address="0x00009888" value="0x0A4C0040" />
+        <register type="NOA" address="0x00009888" value="0x0C0D8000" />
+        <register type="NOA" address="0x00009888" value="0x040D4000" />
+        <register type="NOA" address="0x00009888" value="0x060D2000" />
+        <register type="NOA" address="0x00009888" value="0x020E5400" />
+        <register type="NOA" address="0x00009888" value="0x000E0000" />
+        <register type="NOA" address="0x00009888" value="0x080F0040" />
+        <register type="NOA" address="0x00009888" value="0x000F0000" />
+        <register type="NOA" address="0x00009888" value="0x100F0000" />
+        <register type="NOA" address="0x00009888" value="0x0E0F0040" />
+        <register type="NOA" address="0x00009888" value="0x0C2C8000" />
+        <register type="NOA" address="0x00009888" value="0x06104000" />
+        <register type="NOA" address="0x00009888" value="0x06110012" />
+        <register type="NOA" address="0x00009888" value="0x06131000" />
+        <register type="NOA" address="0x00009888" value="0x01898000" />
+        <register type="NOA" address="0x00009888" value="0x0D890100" />
+        <register type="NOA" address="0x00009888" value="0x03898000" />
+        <register type="NOA" address="0x00009888" value="0x09808000" />
+        <register type="NOA" address="0x00009888" value="0x0B808000" />
+        <register type="NOA" address="0x00009888" value="0x0380C000" />
+        <register type="NOA" address="0x00009888" value="0x0F8A0075" />
+        <register type="NOA" address="0x00009888" value="0x1D8A0000" />
+        <register type="NOA" address="0x00009888" value="0x118A8000" />
+        <register type="NOA" address="0x00009888" value="0x1B8A4000" />
+        <register type="NOA" address="0x00009888" value="0x138A8000" />
+        <register type="NOA" address="0x00009888" value="0x1D81A000" />
+        <register type="NOA" address="0x00009888" value="0x15818000" />
+        <register type="NOA" address="0x00009888" value="0x17818000" />
+        <register type="NOA" address="0x00009888" value="0x0B820030" />
+        <register type="NOA" address="0x00009888" value="0x07828000" />
+        <register type="NOA" address="0x00009888" value="0x0D824000" />
+        <register type="NOA" address="0x00009888" value="0x0F828000" />
+        <register type="NOA" address="0x00009888" value="0x05824000" />
+        <register type="NOA" address="0x00009888" value="0x0D830003" />
+        <register type="NOA" address="0x00009888" value="0x0583000C" />
+        <register type="NOA" address="0x00009888" value="0x09830000" />
+        <register type="NOA" address="0x00009888" value="0x03838000" />
+        <register type="NOA" address="0x00009888" value="0x07838000" />
+        <register type="NOA" address="0x00009888" value="0x0B840980" />
+        <register type="NOA" address="0x00009888" value="0x03844D80" />
+        <register type="NOA" address="0x00009888" value="0x11840000" />
+        <register type="NOA" address="0x00009888" value="0x09848000" />
+        <register type="NOA" address="0x00009888" value="0x09850080" />
+        <register type="NOA" address="0x00009888" value="0x03850003" />
+        <register type="NOA" address="0x00009888" value="0x01850000" />
+        <register type="NOA" address="0x00009888" value="0x07860000" />
+        <register type="NOA" address="0x00009888" value="0x0F860400" />
+        <register type="NOA" address="0x00009888" value="0x09870032" />
+        <register type="NOA" address="0x00009888" value="0x01888052" />
+        <register type="NOA" address="0x00009888" value="0x11880000" />
+        <register type="NOA" address="0x00009888" value="0x09884000" />
+        <register type="NOA" address="0x00009888" value="0x1B931001" />
+        <register type="NOA" address="0x00009888" value="0x1D930001" />
+        <register type="NOA" address="0x00009888" value="0x19934000" />
+        <register type="NOA" address="0x00009888" value="0x1B958000" />
+        <register type="NOA" address="0x00009888" value="0x1D950094" />
+        <register type="NOA" address="0x00009888" value="0x19958000" />
+        <register type="NOA" address="0x00009888" value="0x09E58000" />
+        <register type="NOA" address="0x00009888" value="0x0BE58000" />
+        <register type="NOA" address="0x00009888" value="0x03E5C000" />
+        <register type="NOA" address="0x00009888" value="0x0592C000" />
+        <register type="NOA" address="0x00009888" value="0x0B928000" />
+        <register type="NOA" address="0x00009888" value="0x0D924000" />
+        <register type="NOA" address="0x00009888" value="0x0F924000" />
+        <register type="NOA" address="0x00009888" value="0x11928000" />
+        <register type="NOA" address="0x00009888" value="0x1392C000" />
+        <register type="NOA" address="0x00009888" value="0x09924000" />
+        <register type="NOA" address="0x00009888" value="0x01985000" />
+        <register type="NOA" address="0x00009888" value="0x07988000" />
+        <register type="NOA" address="0x00009888" value="0x09981000" />
+        <register type="NOA" address="0x00009888" value="0x0B982000" />
+        <register type="NOA" address="0x00009888" value="0x0D982000" />
+        <register type="NOA" address="0x00009888" value="0x0F989000" />
+        <register type="NOA" address="0x00009888" value="0x05982000" />
+        <register type="NOA" address="0x00009888" value="0x13904000" />
+        <register type="NOA" address="0x00009888" value="0x21904000" />
+        <register type="NOA" address="0x00009888" value="0x23904000" />
+        <register type="NOA" address="0x00009888" value="0x25908000" />
+        <register type="NOA" address="0x00009888" value="0x27904000" />
+        <register type="NOA" address="0x00009888" value="0x29908000" />
+        <register type="NOA" address="0x00009888" value="0x2B904000" />
+        <register type="NOA" address="0x00009888" value="0x2F904000" />
+        <register type="NOA" address="0x00009888" value="0x31904000" />
+        <register type="NOA" address="0x00009888" value="0x15904000" />
+        <register type="NOA" address="0x00009888" value="0x17908000" />
+        <register type="NOA" address="0x00009888" value="0x19908000" />
+        <register type="NOA" address="0x00009888" value="0x1B904000" />
+        <register type="NOA" address="0x00009888" value="0x1190C080" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x41900440" />
+        <register type="NOA" address="0x00009888" value="0x55900000" />
+        <register type="NOA" address="0x00009888" value="0x45900400" />
+        <register type="NOA" address="0x00009888" value="0x47900C21" />
+        <register type="NOA" address="0x00009888" value="0x57900400" />
+        <register type="NOA" address="0x00009888" value="0x49900042" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+        <register type="NOA" address="0x00009888" value="0x4B900024" />
+        <register type="NOA" address="0x00009888" value="0x59900000" />
+        <register type="NOA" address="0x00009888" value="0x43900841" />
+        <register type="NOA" address="0x00009888" value="0x53900400" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002724" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002770" value="0x0007FFEA" />
+        <register type="OA" address="0x00002774" value="0x00007FFC" />
+        <register type="OA" address="0x00002778" value="0x0007AFFA" />
+        <register type="OA" address="0x0000277C" value="0x0000F5FD" />
+        <register type="OA" address="0x00002780" value="0x00079FFA" />
+        <register type="OA" address="0x00002784" value="0x0000F3FB" />
+        <register type="OA" address="0x00002788" value="0x0007BF7A" />
+        <register type="OA" address="0x0000278C" value="0x0000F7E7" />
+        <register type="OA" address="0x00002790" value="0x0007FEFA" />
+        <register type="OA" address="0x00002794" value="0x0000F7CF" />
+        <register type="OA" address="0x00002798" value="0x00077FFA" />
+        <register type="OA" address="0x0000279C" value="0x0000EFDF" />
+        <register type="OA" address="0x000027A0" value="0x0006FFFA" />
+        <register type="OA" address="0x000027A4" value="0x0000CFBF" />
+        <register type="OA" address="0x000027A8" value="0x0003FFFA" />
+        <register type="OA" address="0x000027AC" value="0x00005F7F" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00015014" />
+        <register type="FLEX" address="0x0000E658" value="0x00025024" />
+        <register type="FLEX" address="0x0000E758" value="0x00035034" />
+        <register type="FLEX" address="0x0000E45C" value="0x00045044" />
+        <register type="FLEX" address="0x0000E55C" value="0x00055054" />
+        <register type="FLEX" address="0x0000E65C" value="0x00065064" />
+    </register_config>
+  </set>
+
+  <set name="Memory Reads Distribution Gen9"
+       mdapi_supported_apis="VK OGL OCL IO BB"
+       underscore_name="memory_reads"
+       hw_config_guid="49c65f34-e625-4ca4-86b7-88693e624d4c"
+       chipset="CFLGT3"
+       symbol_name="MemoryReads"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GtiL3Bank0Reads"
+             description="The total number of GTI memory reads from L3 Bank 0 (L3 Cache misses)."
+             data_type="uint64"
+             equation="C 4 READ"
+             underscore_name="gti_l3_bank0_reads"
+             units="messages"
+             symbol_name="GtiL3Bank0Reads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/L3"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="GtiRingAccesses"
+             description="The total number of all accesses from GTI to the ring."
+             data_type="uint64"
+             equation="C 3 READ 2 UMUL"
+             underscore_name="gti_ring_accesses"
+             units="messages"
+             symbol_name="GtiRingAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="GtiL3Bank3Reads"
+             description="The total number of GTI memory reads from L3 Bank 3 (L3 Cache misses)."
+             data_type="uint64"
+             equation="C 7 READ"
+             underscore_name="gti_l3_bank3_reads"
+             units="messages"
+             symbol_name="GtiL3Bank3Reads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="GTI/L3"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="GtiRsMemoryReads"
+             description="The total number of GTI memory reads from Resource Streamer."
+             data_type="uint64"
+             equation="B 2 READ"
+             underscore_name="gti_rs_memory_reads"
+             units="messages"
+             symbol_name="GtiRsMemoryReads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/3D Pipe/Resource Streamer"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GtiHizMemoryReads"
+             description="The total number of GTI memory reads from Hierarchical Depth Cache (Hi-Depth Cache misses)."
+             data_type="uint64"
+             equation="B 5 READ"
+             underscore_name="gti_hiz_memory_reads"
+             units="messages"
+             symbol_name="GtiHizMemoryReads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Depth Cache"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="GtiRccMemoryReads"
+             description="The total number of GTI memory reads from Render Color Cache (Render Color Cache misses)."
+             data_type="uint64"
+             equation="B 3 READ"
+             underscore_name="gti_rcc_memory_reads"
+             units="messages"
+             symbol_name="GtiRccMemoryReads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Color Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GtiL3Bank1Reads"
+             description="The total number of GTI memory reads from L3 Bank 1 (L3 Cache misses)."
+             data_type="uint64"
+             equation="C 5 READ"
+             underscore_name="gti_l3_bank1_reads"
+             units="messages"
+             symbol_name="GtiL3Bank1Reads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="GTI/L3"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GtiCmdStreamerMemoryReads"
+             description="The total number of GTI memory reads from Command Streamer."
+             data_type="uint64"
+             equation="B 0 READ"
+             underscore_name="gti_cmd_streamer_memory_reads"
+             units="messages"
+             symbol_name="GtiCmdStreamerMemoryReads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/3D Pipe/Command Streamer"
+             />
+    <counter name="GtiL3Bank2Reads"
+             description="The total number of GTI memory reads from L3 Bank 2 (L3 Cache misses)."
+             data_type="uint64"
+             equation="C 6 READ"
+             underscore_name="gti_l3_bank2_reads"
+             units="messages"
+             symbol_name="GtiL3Bank2Reads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="GTI/L3"
+             />
+    <counter name="GtiMemoryReads"
+             description="The total number of GTI memory reads."
+             data_type="uint64"
+             equation="C 0 READ"
+             underscore_name="gti_memory_reads"
+             units="messages"
+             symbol_name="GtiMemoryReads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="GtiRczMemoryReads"
+             description="The total number of GTI memory reads from Render Depth Cache (Render Depth Cache misses)."
+             data_type="uint64"
+             equation="B 7 READ"
+             underscore_name="gti_rcz_memory_reads"
+             units="messages"
+             symbol_name="GtiRczMemoryReads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Depth Cache"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="GtiMscMemoryReads"
+             description="The total number of GTI memory reads from Multisampling Color Cache (Multisampling Color Cache misses)."
+             data_type="uint64"
+             equation="B 4 READ"
+             underscore_name="gti_msc_memory_reads"
+             units="messages"
+             symbol_name="GtiMscMemoryReads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Color Cache"
+             />
+    <counter name="GtiVfMemoryReads"
+             description="The total number of GTI memory reads from Vertex Fetch."
+             data_type="uint64"
+             equation="B 1 READ"
+             underscore_name="gti_vf_memory_reads"
+             units="messages"
+             symbol_name="GtiVfMemoryReads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/3D Pipe/Vertex Fetch"
+             />
+    <counter name="GtiStcMemoryReads"
+             description="The total number of GTI memory reads from Stencil Cache (Stencil Cache misses)."
+             data_type="uint64"
+             equation="B 6 READ"
+             underscore_name="gti_stc_memory_reads"
+             units="messages"
+             symbol_name="GtiStcMemoryReads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Depth Cache"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GtiL3Reads"
+             description="The total number of GTI memory reads from L3 (L3 Cache misses)."
+             data_type="uint64"
+             equation="$GtiL3Bank0Reads $GtiL3Bank1Reads $GtiL3Bank2Reads $GtiL3Bank3Reads UADD UADD UADD"
+             underscore_name="gti_l3_reads"
+             units="messages"
+             symbol_name="GtiL3Reads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/L3"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x11810C00" />
+        <register type="NOA" address="0x00009888" value="0x1381001A" />
+        <register type="NOA" address="0x00009888" value="0x37906800" />
+        <register type="NOA" address="0x00009888" value="0x3F900064" />
+        <register type="NOA" address="0x00009888" value="0x03811300" />
+        <register type="NOA" address="0x00009888" value="0x05811B12" />
+        <register type="NOA" address="0x00009888" value="0x0781001A" />
+        <register type="NOA" address="0x00009888" value="0x1F810000" />
+        <register type="NOA" address="0x00009888" value="0x17810000" />
+        <register type="NOA" address="0x00009888" value="0x19810000" />
+        <register type="NOA" address="0x00009888" value="0x1B810000" />
+        <register type="NOA" address="0x00009888" value="0x1D810000" />
+        <register type="NOA" address="0x00009888" value="0x1B930055" />
+        <register type="NOA" address="0x00009888" value="0x03E58000" />
+        <register type="NOA" address="0x00009888" value="0x05E5C000" />
+        <register type="NOA" address="0x00009888" value="0x07E54000" />
+        <register type="NOA" address="0x00009888" value="0x13900150" />
+        <register type="NOA" address="0x00009888" value="0x21900151" />
+        <register type="NOA" address="0x00009888" value="0x23900152" />
+        <register type="NOA" address="0x00009888" value="0x25900153" />
+        <register type="NOA" address="0x00009888" value="0x27900154" />
+        <register type="NOA" address="0x00009888" value="0x29900155" />
+        <register type="NOA" address="0x00009888" value="0x2B900156" />
+        <register type="NOA" address="0x00009888" value="0x2D900157" />
+        <register type="NOA" address="0x00009888" value="0x2F90015F" />
+        <register type="NOA" address="0x00009888" value="0x31900105" />
+        <register type="NOA" address="0x00009888" value="0x15900103" />
+        <register type="NOA" address="0x00009888" value="0x17900101" />
+        <register type="NOA" address="0x00009888" value="0x35900000" />
+        <register type="NOA" address="0x00009888" value="0x19908000" />
+        <register type="NOA" address="0x00009888" value="0x1B908000" />
+        <register type="NOA" address="0x00009888" value="0x1D908000" />
+        <register type="NOA" address="0x00009888" value="0x1F908000" />
+        <register type="NOA" address="0x00009888" value="0x11900000" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x41900C60" />
+        <register type="NOA" address="0x00009888" value="0x55900000" />
+        <register type="NOA" address="0x00009888" value="0x45900C00" />
+        <register type="NOA" address="0x00009888" value="0x47900C63" />
+        <register type="NOA" address="0x00009888" value="0x57900000" />
+        <register type="NOA" address="0x00009888" value="0x49900C63" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+        <register type="NOA" address="0x00009888" value="0x4B900063" />
+        <register type="NOA" address="0x00009888" value="0x59900000" />
+        <register type="NOA" address="0x00009888" value="0x43900003" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x0000272C" value="0xFFFFFFFF" />
+        <register type="OA" address="0x00002728" value="0xFFFFFFFF" />
+        <register type="OA" address="0x00002724" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x0000271C" value="0xFFFFFFFF" />
+        <register type="OA" address="0x00002718" value="0xFFFFFFFF" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x0000274C" value="0x86543210" />
+        <register type="OA" address="0x00002748" value="0x86543210" />
+        <register type="OA" address="0x00002744" value="0x00006667" />
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x0000275C" value="0x86543210" />
+        <register type="OA" address="0x00002758" value="0x86543210" />
+        <register type="OA" address="0x00002754" value="0x00006465" />
+        <register type="OA" address="0x00002750" value="0x00000000" />
+        <register type="OA" address="0x00002770" value="0x0007F81A" />
+        <register type="OA" address="0x00002774" value="0x0000FE00" />
+        <register type="OA" address="0x00002778" value="0x0007F82A" />
+        <register type="OA" address="0x0000277C" value="0x0000FE00" />
+        <register type="OA" address="0x00002780" value="0x0007F872" />
+        <register type="OA" address="0x00002784" value="0x0000FE00" />
+        <register type="OA" address="0x00002788" value="0x0007F8BA" />
+        <register type="OA" address="0x0000278C" value="0x0000FE00" />
+        <register type="OA" address="0x00002790" value="0x0007F87A" />
+        <register type="OA" address="0x00002794" value="0x0000FE00" />
+        <register type="OA" address="0x00002798" value="0x0007F8EA" />
+        <register type="OA" address="0x0000279C" value="0x0000FE00" />
+        <register type="OA" address="0x000027A0" value="0x0007F8E2" />
+        <register type="OA" address="0x000027A4" value="0x0000FE00" />
+        <register type="OA" address="0x000027A8" value="0x0007F8F2" />
+        <register type="OA" address="0x000027AC" value="0x0000FE00" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00015014" />
+        <register type="FLEX" address="0x0000E658" value="0x00025024" />
+        <register type="FLEX" address="0x0000E758" value="0x00035034" />
+        <register type="FLEX" address="0x0000E45C" value="0x00045044" />
+        <register type="FLEX" address="0x0000E55C" value="0x00055054" />
+        <register type="FLEX" address="0x0000E65C" value="0x00065064" />
+    </register_config>
+  </set>
+
+  <set name="Memory Writes Distribution Gen9"
+       mdapi_supported_apis="VK OGL OCL IO BB"
+       underscore_name="memory_writes"
+       hw_config_guid="45c9e8ee-2998-4d83-88e8-9cb7e03287bf"
+       chipset="CFLGT3"
+       symbol_name="MemoryWrites"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GtiMemoryWrites"
+             description="The total number of GTI memory writes."
+             data_type="uint64"
+             equation="C 0 READ"
+             underscore_name="gti_memory_writes"
+             units="messages"
+             symbol_name="GtiMemoryWrites"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="GtiRingAccesses"
+             description="The total number of all GTI accesses to the ring."
+             data_type="uint64"
+             equation="C 3 READ 2 UMUL"
+             underscore_name="gti_ring_accesses"
+             units="messages"
+             symbol_name="GtiRingAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="GtiMscMemoryWrites"
+             description="The total number of GTI memory writes from Multisampling Color Cache (Multisampling Color Cache invalidations)."
+             data_type="uint64"
+             equation="B 4 READ"
+             underscore_name="gti_msc_memory_writes"
+             units="messages"
+             symbol_name="GtiMscMemoryWrites"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Color Cache"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="GtiCmdStreamerMemoryWrites"
+             description="The total number of GTI memory writes from Command Streamer."
+             data_type="uint64"
+             equation="B 0 READ"
+             underscore_name="gti_cmd_streamer_memory_writes"
+             units="messages"
+             symbol_name="GtiCmdStreamerMemoryWrites"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/3D Pipe/Command Streamer"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GtiL3Bank0Writes"
+             description="The total number of GTI memory writes from L3 Bank 0 (L3 Bank 0 invalidations)."
+             data_type="uint64"
+             equation="C 4 READ"
+             underscore_name="gti_l3_bank0_writes"
+             units="messages"
+             symbol_name="GtiL3Bank0Writes"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/L3"
+             />
+    <counter name="GtiL3Bank1Writes"
+             description="The total number of GTI memory writes from L3 Bank 1 (L3 Bank 1 invalidations)."
+             data_type="uint64"
+             equation="C 5 READ"
+             underscore_name="gti_l3_bank1_writes"
+             units="messages"
+             symbol_name="GtiL3Bank1Writes"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/L3"
+             />
+    <counter name="GtiL3Bank2Writes"
+             description="The total number of GTI memory writes from L3 Bank 2 (L3 Bank 2 invalidations)."
+             data_type="uint64"
+             equation="C 6 READ"
+             underscore_name="gti_l3_bank2_writes"
+             units="messages"
+             symbol_name="GtiL3Bank2Writes"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/L3"
+             />
+    <counter name="GtiL3Bank3Writes"
+             description="The total number of GTI memory writes from L3 Bank 3 (L3 Bank 3 invalidations)."
+             data_type="uint64"
+             equation="C 7 READ"
+             underscore_name="gti_l3_bank3_writes"
+             units="messages"
+             symbol_name="GtiL3Bank3Writes"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/L3"
+             />
+    <counter name="GtiL3Writes"
+             description="The total number of GTI memory writes from L3 (L3 invalidations)."
+             data_type="uint64"
+             equation="$GtiL3Bank0Writes $GtiL3Bank1Writes $GtiL3Bank2Writes $GtiL3Bank3Writes UADD UADD UADD"
+             underscore_name="gti_l3_writes"
+             units="messages"
+             symbol_name="GtiL3Writes"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/L3"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GtiRccMemoryWrites"
+             description="The total number of GTI memory writes from Render Color Cache (Render Color Cache invalidations)."
+             data_type="uint64"
+             equation="B 3 READ"
+             underscore_name="gti_rcc_memory_writes"
+             units="messages"
+             symbol_name="GtiRccMemoryWrites"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Color Cache"
+             />
+    <counter name="GtiSoMemoryWrites"
+             description="The total number of GTI memory writes from Stream Output."
+             data_type="uint64"
+             equation="B 2 READ"
+             underscore_name="gti_so_memory_writes"
+             units="messages"
+             symbol_name="GtiSoMemoryWrites"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/3D Pipe/Stream Output"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GtiStcMemoryWrites"
+             description="The total number of GTI memory writes from Stencil Cache."
+             data_type="uint64"
+             equation="B 6 READ"
+             underscore_name="gti_stc_memory_writes"
+             units="messages"
+             symbol_name="GtiStcMemoryWrites"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Depth Cache"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="GtiRczMemoryWrites"
+             description="The total number of GTI memory writes from Render Depth Cache."
+             data_type="uint64"
+             equation="B 7 READ"
+             underscore_name="gti_rcz_memory_writes"
+             units="messages"
+             symbol_name="GtiRczMemoryWrites"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Depth Cache"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="GtiHizMemoryWrites"
+             description="The total number of GTI memory writes from Hierarchical Depth Cache."
+             data_type="uint64"
+             equation="B 5 READ"
+             underscore_name="gti_hiz_memory_writes"
+             units="messages"
+             symbol_name="GtiHizMemoryWrites"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Depth Cache"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x11810C00" />
+        <register type="NOA" address="0x00009888" value="0x1381001A" />
+        <register type="NOA" address="0x00009888" value="0x37906800" />
+        <register type="NOA" address="0x00009888" value="0x3F901000" />
+        <register type="NOA" address="0x00009888" value="0x03811300" />
+        <register type="NOA" address="0x00009888" value="0x05811B12" />
+        <register type="NOA" address="0x00009888" value="0x0781001A" />
+        <register type="NOA" address="0x00009888" value="0x1F810000" />
+        <register type="NOA" address="0x00009888" value="0x17810000" />
+        <register type="NOA" address="0x00009888" value="0x19810000" />
+        <register type="NOA" address="0x00009888" value="0x1B810000" />
+        <register type="NOA" address="0x00009888" value="0x1D810000" />
+        <register type="NOA" address="0x00009888" value="0x1B930055" />
+        <register type="NOA" address="0x00009888" value="0x03E58000" />
+        <register type="NOA" address="0x00009888" value="0x05E5C000" />
+        <register type="NOA" address="0x00009888" value="0x07E54000" />
+        <register type="NOA" address="0x00009888" value="0x13900160" />
+        <register type="NOA" address="0x00009888" value="0x21900161" />
+        <register type="NOA" address="0x00009888" value="0x23900162" />
+        <register type="NOA" address="0x00009888" value="0x25900163" />
+        <register type="NOA" address="0x00009888" value="0x27900164" />
+        <register type="NOA" address="0x00009888" value="0x29900165" />
+        <register type="NOA" address="0x00009888" value="0x2B900166" />
+        <register type="NOA" address="0x00009888" value="0x2D900167" />
+        <register type="NOA" address="0x00009888" value="0x2F900150" />
+        <register type="NOA" address="0x00009888" value="0x31900105" />
+        <register type="NOA" address="0x00009888" value="0x15900103" />
+        <register type="NOA" address="0x00009888" value="0x17900101" />
+        <register type="NOA" address="0x00009888" value="0x35900000" />
+        <register type="NOA" address="0x00009888" value="0x19908000" />
+        <register type="NOA" address="0x00009888" value="0x1B908000" />
+        <register type="NOA" address="0x00009888" value="0x1D908000" />
+        <register type="NOA" address="0x00009888" value="0x1F908000" />
+        <register type="NOA" address="0x00009888" value="0x11900000" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x41900C60" />
+        <register type="NOA" address="0x00009888" value="0x55900000" />
+        <register type="NOA" address="0x00009888" value="0x45900C00" />
+        <register type="NOA" address="0x00009888" value="0x47900C63" />
+        <register type="NOA" address="0x00009888" value="0x57900000" />
+        <register type="NOA" address="0x00009888" value="0x49900C63" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+        <register type="NOA" address="0x00009888" value="0x4B900063" />
+        <register type="NOA" address="0x00009888" value="0x59900000" />
+        <register type="NOA" address="0x00009888" value="0x43900003" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x0000272C" value="0xFFFFFFFF" />
+        <register type="OA" address="0x00002728" value="0xFFFFFFFF" />
+        <register type="OA" address="0x00002724" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x0000271C" value="0xFFFFFFFF" />
+        <register type="OA" address="0x00002718" value="0xFFFFFFFF" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x0000274C" value="0x86543210" />
+        <register type="OA" address="0x00002748" value="0x86543210" />
+        <register type="OA" address="0x00002744" value="0x00006667" />
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x0000275C" value="0x86543210" />
+        <register type="OA" address="0x00002758" value="0x86543210" />
+        <register type="OA" address="0x00002754" value="0x00006465" />
+        <register type="OA" address="0x00002750" value="0x00000000" />
+        <register type="OA" address="0x00002770" value="0x0007F81A" />
+        <register type="OA" address="0x00002774" value="0x0000FE00" />
+        <register type="OA" address="0x00002778" value="0x0007F82A" />
+        <register type="OA" address="0x0000277C" value="0x0000FE00" />
+        <register type="OA" address="0x00002780" value="0x0007F822" />
+        <register type="OA" address="0x00002784" value="0x0000FE00" />
+        <register type="OA" address="0x00002788" value="0x0007F8BA" />
+        <register type="OA" address="0x0000278C" value="0x0000FE00" />
+        <register type="OA" address="0x00002790" value="0x0007F87A" />
+        <register type="OA" address="0x00002794" value="0x0000FE00" />
+        <register type="OA" address="0x00002798" value="0x0007F8EA" />
+        <register type="OA" address="0x0000279C" value="0x0000FE00" />
+        <register type="OA" address="0x000027A0" value="0x0007F8E2" />
+        <register type="OA" address="0x000027A4" value="0x0000FE00" />
+        <register type="OA" address="0x000027A8" value="0x0007F8F2" />
+        <register type="OA" address="0x000027AC" value="0x0000FE00" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00015014" />
+        <register type="FLEX" address="0x0000E658" value="0x00025024" />
+        <register type="FLEX" address="0x0000E758" value="0x00035034" />
+        <register type="FLEX" address="0x0000E45C" value="0x00045044" />
+        <register type="FLEX" address="0x0000E55C" value="0x00055054" />
+        <register type="FLEX" address="0x0000E65C" value="0x00065064" />
+    </register_config>
+  </set>
+
+  <set name="Compute Metrics Extended Gen9"
+       mdapi_supported_apis="VK OGL4 OCL IO BB"
+       underscore_name="compute_extended"
+       hw_config_guid="bac415ce-d7a2-4f8d-9b16-834deba7330e"
+       chipset="CFLGT3"
+       symbol_name="ComputeExtended"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="fpu0_active"
+             units="percent"
+             symbol_name="Fpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="fpu1_active"
+             units="percent"
+             symbol_name="Fpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU AVG IPC Rate"
+             description="The average rate of IPC calculated for 2 FPU pipelines."
+             data_type="float"
+             max_equation="2"
+             equation="A 9 READ  A 10 READ  A 11 READ UADD  A 9 READ USUB FDIV 1 FADD"
+             underscore_name="eu_avg_ipc_rate"
+             units="number"
+             symbol_name="EuAvgIpcRate"
+             semantic_type="ratio"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Typed Writes 0"
+             description="The subslice 0 typed writes."
+             data_type="uint64"
+             equation="C 0 READ"
+             underscore_name="typed_writes0"
+             units="messages"
+             symbol_name="TypedWrites0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="EuTypedAtomics0"
+             description="The subslice 0 EU Typed Atomics subslice 0."
+             data_type="uint64"
+             equation="B 5 READ"
+             underscore_name="eu_typed_atomics0"
+             units="messages"
+             symbol_name="EuTypedAtomics0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="Typed Atomics 0"
+             description="The subslice 0 typed atomics."
+             data_type="uint64"
+             equation="C 4 READ"
+             underscore_name="typed_atomics0"
+             units="messages"
+             symbol_name="TypedAtomics0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="TypedAtomicsPerCacheLine"
+             description="The ratio of EU typed atomics requests to L3 cache line writes."
+             data_type="float"
+             equation="$EuTypedAtomics0 $TypedAtomics0 FDIV"
+             underscore_name="typed_atomics_per_cache_line"
+             units="eu sends to l3 cache lines"
+             symbol_name="TypedAtomicsPerCacheLine"
+             semantic_type="ratio"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="EuUntypedReads0"
+             description="The subslice 0 EU Untyped Reads subslice 0."
+             data_type="uint64"
+             equation="B 0 READ"
+             underscore_name="eu_untyped_reads0"
+             units="messages"
+             symbol_name="EuUntypedReads0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="Untyped Writes 0"
+             description="The subslice 0 untyped writes (including SLM writes)."
+             data_type="uint64"
+             equation="C 1 READ"
+             underscore_name="untyped_writes0"
+             units="messages"
+             symbol_name="UntypedWrites0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="EuUntypedAtomics0"
+             description="The subslice 0 EU Untyped Atomics subslice 0."
+             data_type="uint64"
+             equation="B 4 READ"
+             underscore_name="eu_untyped_atomics0"
+             units="messages"
+             symbol_name="EuUntypedAtomics0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="EuUntypedWrites0"
+             description="The subslice 0 EU Untyped Writes subslice 0."
+             data_type="uint64"
+             equation="B 1 READ"
+             underscore_name="eu_untyped_writes0"
+             units="messages"
+             symbol_name="EuUntypedWrites0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="EuA64UntypedWrites0"
+             description="The subslice 0 EU A64 Untyped Writes subslice 0."
+             data_type="uint64"
+             equation="B 7 READ"
+             underscore_name="eu_a64_untyped_writes0"
+             units="messages"
+             symbol_name="EuA64UntypedWrites0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="UntypedWritesPerCacheLine"
+             description="The ratio of EU untyped write requests to L3 cache line writes."
+             data_type="float"
+             equation="$EuUntypedWrites0 $EuA64UntypedWrites0 UADD $UntypedWrites0 FDIV"
+             underscore_name="untyped_writes_per_cache_line"
+             units="eu sends to l3 cache lines"
+             symbol_name="UntypedWritesPerCacheLine"
+             semantic_type="ratio"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EuTypedWrites0"
+             description="The subslice 0 EU Typed Writes subslice 0."
+             data_type="uint64"
+             equation="B 3 READ"
+             underscore_name="eu_typed_writes0"
+             units="messages"
+             symbol_name="EuTypedWrites0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="TypedWritesPerCacheLine"
+             description="The ratio of EU typed write requests to L3 cache line writes."
+             data_type="float"
+             equation="$EuTypedWrites0 $TypedWrites0 FDIV"
+             underscore_name="typed_writes_per_cache_line"
+             units="eu sends to l3 cache lines"
+             symbol_name="TypedWritesPerCacheLine"
+             semantic_type="ratio"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="Typed Reads 0"
+             description="The subslice 0 typed reads."
+             data_type="uint64"
+             equation="C 2 READ"
+             underscore_name="typed_reads0"
+             units="messages"
+             symbol_name="TypedReads0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="Untyped Reads 0"
+             description="The subslice 0 untyped reads (including SLM reads)."
+             data_type="uint64"
+             equation="C 3 READ"
+             underscore_name="untyped_reads0"
+             units="messages"
+             symbol_name="UntypedReads0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="EuA64UntypedReads0"
+             description="The subslice 0 EU A64 Untyped Reads subslice 0."
+             data_type="uint64"
+             equation="B 6 READ"
+             underscore_name="eu_a64_untyped_reads0"
+             units="messages"
+             symbol_name="EuA64UntypedReads0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="EU Thread Occupancy"
+             description="The percentage of time in which hardware threads occupied EUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 13 READ 8 UMUL $EuCoresTotalCount UDIV $EuThreadsCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_thread_occupancy"
+             units="percent"
+             symbol_name="EuThreadOccupancy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EuTypedReads0"
+             description="The subslice 0 EU Typed Reads subslice 0."
+             data_type="uint64"
+             equation="B 2 READ"
+             underscore_name="eu_typed_reads0"
+             units="messages"
+             symbol_name="EuTypedReads0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="UntypedReadsPerCacheLine"
+             description="The ratio of EU untyped read requests to L3 cache line reads."
+             data_type="float"
+             equation="$EuUntypedReads0 $EuA64UntypedReads0 UADD $UntypedReads0 FDIV"
+             underscore_name="untyped_reads_per_cache_line"
+             units="eu sends to l3 cache lines"
+             symbol_name="UntypedReadsPerCacheLine"
+             semantic_type="ratio"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="TypedReadsPerCacheLine"
+             description="The ratio of EU typed read requests to L3 cache line reads."
+             data_type="float"
+             equation="$EuTypedReads0 $TypedReads0 FDIV"
+             underscore_name="typed_reads_per_cache_line"
+             units="eu sends to l3 cache lines"
+             symbol_name="TypedReadsPerCacheLine"
+             semantic_type="ratio"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <counter name="EU Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_send_active"
+             units="percent"
+             symbol_name="EuSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x106C00E0" />
+        <register type="NOA" address="0x00009888" value="0x141C8160" />
+        <register type="NOA" address="0x00009888" value="0x161C8015" />
+        <register type="NOA" address="0x00009888" value="0x181C0120" />
+        <register type="NOA" address="0x00009888" value="0x004E8000" />
+        <register type="NOA" address="0x00009888" value="0x0E4E8000" />
+        <register type="NOA" address="0x00009888" value="0x184E8000" />
+        <register type="NOA" address="0x00009888" value="0x1A4EAAA0" />
+        <register type="NOA" address="0x00009888" value="0x1C4E0002" />
+        <register type="NOA" address="0x00009888" value="0x024E8000" />
+        <register type="NOA" address="0x00009888" value="0x044E8000" />
+        <register type="NOA" address="0x00009888" value="0x064E8000" />
+        <register type="NOA" address="0x00009888" value="0x084E8000" />
+        <register type="NOA" address="0x00009888" value="0x0A4E8000" />
+        <register type="NOA" address="0x00009888" value="0x0E6C0B01" />
+        <register type="NOA" address="0x00009888" value="0x006C0200" />
+        <register type="NOA" address="0x00009888" value="0x026C000C" />
+        <register type="NOA" address="0x00009888" value="0x1C6C0000" />
+        <register type="NOA" address="0x00009888" value="0x1E6C0000" />
+        <register type="NOA" address="0x00009888" value="0x1A6C0000" />
+        <register type="NOA" address="0x00009888" value="0x0E1BC000" />
+        <register type="NOA" address="0x00009888" value="0x001B8000" />
+        <register type="NOA" address="0x00009888" value="0x021BC000" />
+        <register type="NOA" address="0x00009888" value="0x001C0041" />
+        <register type="NOA" address="0x00009888" value="0x061C4200" />
+        <register type="NOA" address="0x00009888" value="0x081C4443" />
+        <register type="NOA" address="0x00009888" value="0x0A1C4645" />
+        <register type="NOA" address="0x00009888" value="0x0C1C7647" />
+        <register type="NOA" address="0x00009888" value="0x041C7357" />
+        <register type="NOA" address="0x00009888" value="0x1C1C0030" />
+        <register type="NOA" address="0x00009888" value="0x101C0000" />
+        <register type="NOA" address="0x00009888" value="0x1A1C0000" />
+        <register type="NOA" address="0x00009888" value="0x121C8000" />
+        <register type="NOA" address="0x00009888" value="0x004C8000" />
+        <register type="NOA" address="0x00009888" value="0x0A4CAA2A" />
+        <register type="NOA" address="0x00009888" value="0x0C4C02AA" />
+        <register type="NOA" address="0x00009888" value="0x084CA000" />
+        <register type="NOA" address="0x00009888" value="0x000DA000" />
+        <register type="NOA" address="0x00009888" value="0x060D8000" />
+        <register type="NOA" address="0x00009888" value="0x080DA000" />
+        <register type="NOA" address="0x00009888" value="0x0A0DA000" />
+        <register type="NOA" address="0x00009888" value="0x0C0DA000" />
+        <register type="NOA" address="0x00009888" value="0x0E0DA000" />
+        <register type="NOA" address="0x00009888" value="0x020DA000" />
+        <register type="NOA" address="0x00009888" value="0x040DA000" />
+        <register type="NOA" address="0x00009888" value="0x0C0F5400" />
+        <register type="NOA" address="0x00009888" value="0x0E0F5515" />
+        <register type="NOA" address="0x00009888" value="0x100F0155" />
+        <register type="NOA" address="0x00009888" value="0x002C8000" />
+        <register type="NOA" address="0x00009888" value="0x0E2C8000" />
+        <register type="NOA" address="0x00009888" value="0x162CAA00" />
+        <register type="NOA" address="0x00009888" value="0x182C00AA" />
+        <register type="NOA" address="0x00009888" value="0x022C8000" />
+        <register type="NOA" address="0x00009888" value="0x042C8000" />
+        <register type="NOA" address="0x00009888" value="0x062C8000" />
+        <register type="NOA" address="0x00009888" value="0x082C8000" />
+        <register type="NOA" address="0x00009888" value="0x0A2C8000" />
+        <register type="NOA" address="0x00009888" value="0x11907FFF" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x41900040" />
+        <register type="NOA" address="0x00009888" value="0x55900000" />
+        <register type="NOA" address="0x00009888" value="0x45900802" />
+        <register type="NOA" address="0x00009888" value="0x47900842" />
+        <register type="NOA" address="0x00009888" value="0x57900000" />
+        <register type="NOA" address="0x00009888" value="0x49900842" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+        <register type="NOA" address="0x00009888" value="0x4B900000" />
+        <register type="NOA" address="0x00009888" value="0x59900000" />
+        <register type="NOA" address="0x00009888" value="0x43900800" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002724" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002770" value="0x0007FC2A" />
+        <register type="OA" address="0x00002774" value="0x0000BF00" />
+        <register type="OA" address="0x00002778" value="0x0007FC6A" />
+        <register type="OA" address="0x0000277C" value="0x0000BF00" />
+        <register type="OA" address="0x00002780" value="0x0007FC92" />
+        <register type="OA" address="0x00002784" value="0x0000BF00" />
+        <register type="OA" address="0x00002788" value="0x0007FCA2" />
+        <register type="OA" address="0x0000278C" value="0x0000BF00" />
+        <register type="OA" address="0x00002790" value="0x0007FC32" />
+        <register type="OA" address="0x00002794" value="0x0000BF00" />
+        <register type="OA" address="0x00002798" value="0x0007FC9A" />
+        <register type="OA" address="0x0000279C" value="0x0000BF00" />
+        <register type="OA" address="0x000027A0" value="0x0007FE6A" />
+        <register type="OA" address="0x000027A4" value="0x0000BF00" />
+        <register type="OA" address="0x000027A8" value="0x0007FE7A" />
+        <register type="OA" address="0x000027AC" value="0x0000BF00" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00000003" />
+        <register type="FLEX" address="0x0000E658" value="0x00002001" />
+        <register type="FLEX" address="0x0000E758" value="0x00778008" />
+        <register type="FLEX" address="0x0000E45C" value="0x00088078" />
+        <register type="FLEX" address="0x0000E55C" value="0x00808708" />
+        <register type="FLEX" address="0x0000E65C" value="0x00A08908" />
+    </register_config>
+  </set>
+
+  <set name="Compute Metrics L3 Cache Gen9"
+       mdapi_supported_apis="VK OGL4 OCL IO BB"
+       underscore_name="compute_l3_cache"
+       hw_config_guid="a8cfca44-0e74-4338-9e57-3daad98957dd"
+       chipset="CFLGT3"
+       symbol_name="ComputeL3Cache"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Bank 03 Accesses"
+             description="The total number of accesses to L3 Bank 03."
+             data_type="uint64"
+             equation="B 3 READ 2 UMUL"
+             underscore_name="l3_bank03_accesses"
+             units="messages"
+             symbol_name="L3Bank03Accesses"
+             availability="$SliceMask 0x01 AND"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="slice"
+             mdapi_group="L3"
+             />
+    <counter name="L3 Accesses"
+             description="The total number of L3 accesses from all entities."
+             data_type="uint64"
+             equation="C 0 READ C 1 READ B 2 READ B 3 READ UADD UADD UADD 2 UMUL"
+             underscore_name="l3_accesses"
+             units="messages"
+             symbol_name="L3Accesses"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Sampler Throughput"
+             description="The total number of GPU memory bytes transferred between samplers and L3 caches."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="A 29 READ 64 UMUL"
+             underscore_name="l3_sampler_throughput"
+             units="bytes"
+             symbol_name="L3SamplerThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Sampler"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="fpu0_active"
+             units="percent"
+             symbol_name="Fpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="fpu1_active"
+             units="percent"
+             symbol_name="Fpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU AVG IPC Rate"
+             description="The average rate of IPC calculated for 2 FPU pipelines."
+             data_type="float"
+             max_equation="2"
+             equation="A 9 READ  A 10 READ  A 11 READ UADD  A 9 READ USUB FDIV 1 FADD"
+             underscore_name="eu_avg_ipc_rate"
+             units="number"
+             symbol_name="EuAvgIpcRate"
+             semantic_type="ratio"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier4 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU0 Binary Instruction"
+             description="The percentage of time in which execution units were actively processing binary instructions on FPU0."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_binary_fpu0_instruction"
+             units="percent"
+             symbol_name="EuBinaryFpu0Instruction"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes/Instructions"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="EU FPU0 Hybrid Instruction"
+             description="The percentage of time in which execution units were actively processing hybrid instructions on FPU0."
+             data_type="float"
+             max_equation="100"
+             equation="A 13 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_hybrid_fpu0_instruction"
+             units="percent"
+             symbol_name="EuHybridFpu0Instruction"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="EU Array/Pipes/Instructions"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Misses"
+             description="The total number of L3 misses."
+             data_type="uint64"
+             equation="C 4 READ C 5 READ UADD"
+             underscore_name="l3_misses"
+             units="messages"
+             symbol_name="L3Misses"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/TAG"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="L3 Bank 00 Accesses"
+             description="The total number of accesses to L3 Bank 00."
+             data_type="uint64"
+             equation="C 0 READ 2 UMUL"
+             underscore_name="l3_bank00_accesses"
+             units="messages"
+             symbol_name="L3Bank00Accesses"
+             availability="$SliceMask 0x01 AND"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="slice"
+             mdapi_group="L3"
+             />
+    <counter name="EU FPU0 Move Instruction"
+             description="The percentage of time in which execution units were actively processing move instructions on FPU0."
+             data_type="float"
+             max_equation="100"
+             equation="A 19 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_move_fpu0_instruction"
+             units="percent"
+             symbol_name="EuMoveFpu0Instruction"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes/Instructions"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU FPU1 Hybrid Instruction"
+             description="The percentage of time in which execution units were actively processing hybrid instructions on FPU1."
+             data_type="float"
+             max_equation="100"
+             equation="A 14 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_hybrid_fpu1_instruction"
+             units="percent"
+             symbol_name="EuHybridFpu1Instruction"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="EU Array/Pipes/Instructions"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GTI Read Throughput"
+             description="The total number of GPU memory bytes read from GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL"
+             equation="C 6 READ 64 UMUL"
+             underscore_name="gti_read_throughput"
+             units="bytes"
+             symbol_name="GtiReadThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GTI L3 Throughput"
+             description="The total number of GPU memory bytes transferred between L3 caches and GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="C 4 READ C 5 READ UADD 64 UMUL"
+             underscore_name="gti_l3_throughput"
+             units="bytes"
+             symbol_name="GtiL3Throughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Bank 00 IC Accesses"
+             description="The total number of accesses to L3 Bank 00 from IC cache."
+             data_type="uint64"
+             equation="B 0 READ B 1 READ UADD 2 UMUL $L3Bank00Accesses UMIN"
+             underscore_name="l3_bank00_ic_accesses"
+             units="messages"
+             symbol_name="L3Bank00IcAccesses"
+             availability="$SliceMask 0x01 AND"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="slice"
+             mdapi_group="L3/IC"
+             />
+    <counter name="L3 Bank 00 IC Hits"
+             description="The total number of hits in L3 Bank 00 from IC cache."
+             data_type="uint64"
+             equation="B 1 READ 2 UMUL $L3Bank00IcAccesses UMIN"
+             underscore_name="l3_bank00_ic_hits"
+             units="messages"
+             symbol_name="L3Bank00IcHits"
+             availability="$SliceMask 0x01 AND"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="slice"
+             mdapi_group="L3/IC"
+             />
+    <counter name="Sampler Accesses"
+             description="The total number of messages send to samplers."
+             data_type="uint64"
+             equation="A 28 READ"
+             underscore_name="sampler_accesses"
+             units="messages"
+             symbol_name="SamplerAccesses"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler"
+             />
+    <counter name="L3 Bank 01 Accesses"
+             description="The total number of accesses to L3 Bank 01."
+             data_type="uint64"
+             equation="C 1 READ 2 UMUL"
+             underscore_name="l3_bank01_accesses"
+             units="messages"
+             symbol_name="L3Bank01Accesses"
+             availability="$SliceMask 0x01 AND"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="slice"
+             mdapi_group="L3"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU0 Ternary Instruction"
+             description="The percentage of time in which execution units were actively processing ternary instructions on FPU0."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_ternary_fpu0_instruction"
+             units="percent"
+             symbol_name="EuTernaryFpu0Instruction"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes/Instructions"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU FPU1 Move Instruction"
+             description="The percentage of time in which execution units were actively processing move instructions on FPU1."
+             data_type="float"
+             max_equation="100"
+             equation="A 20 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_move_fpu1_instruction"
+             units="percent"
+             symbol_name="EuMoveFpu1Instruction"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes/Instructions"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="L3 Bank 02 Accesses"
+             description="The total number of accesses to L3 Bank 02."
+             data_type="uint64"
+             equation="B 2 READ 2 UMUL"
+             underscore_name="l3_bank02_accesses"
+             units="messages"
+             symbol_name="L3Bank02Accesses"
+             availability="$SliceMask 0x01 AND"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="slice"
+             mdapi_group="L3"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="L3 Total Throughput"
+             description="The total number of GPU memory bytes transferred via L3."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="$L3Accesses 64 UMUL"
+             underscore_name="l3_total_throughput"
+             units="bytes"
+             symbol_name="L3TotalThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GTI Write Throughput"
+             description="The total number of GPU memory bytes written to GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 32 UMUL"
+             equation="C 7 READ 64 UMUL"
+             underscore_name="gti_write_throughput"
+             units="bytes"
+             symbol_name="GtiWriteThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="EU FPU1 Binary Instruction"
+             description="The percentage of time in which execution units were actively processing binary instructions on FPU1."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_binary_fpu1_instruction"
+             units="percent"
+             symbol_name="EuBinaryFpu1Instruction"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes/Instructions"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU1 Ternary Instruction"
+             description="The percentage of time in which execution units were actively processing ternary instructions on FPU1."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_ternary_fpu1_instruction"
+             units="percent"
+             symbol_name="EuTernaryFpu1Instruction"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes/Instructions"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_send_active"
+             units="percent"
+             symbol_name="EuSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x166C0760" />
+        <register type="NOA" address="0x00009888" value="0x1593001E" />
+        <register type="NOA" address="0x00009888" value="0x3F900003" />
+        <register type="NOA" address="0x00009888" value="0x004E8000" />
+        <register type="NOA" address="0x00009888" value="0x0E4E8000" />
+        <register type="NOA" address="0x00009888" value="0x184E8000" />
+        <register type="NOA" address="0x00009888" value="0x1A4E8020" />
+        <register type="NOA" address="0x00009888" value="0x1C4E0002" />
+        <register type="NOA" address="0x00009888" value="0x006C0051" />
+        <register type="NOA" address="0x00009888" value="0x066C5000" />
+        <register type="NOA" address="0x00009888" value="0x086C5C5D" />
+        <register type="NOA" address="0x00009888" value="0x0E6C5E5F" />
+        <register type="NOA" address="0x00009888" value="0x106C0000" />
+        <register type="NOA" address="0x00009888" value="0x186C0000" />
+        <register type="NOA" address="0x00009888" value="0x1C6C0000" />
+        <register type="NOA" address="0x00009888" value="0x1E6C0000" />
+        <register type="NOA" address="0x00009888" value="0x001B4000" />
+        <register type="NOA" address="0x00009888" value="0x061B8000" />
+        <register type="NOA" address="0x00009888" value="0x081BC000" />
+        <register type="NOA" address="0x00009888" value="0x0E1BC000" />
+        <register type="NOA" address="0x00009888" value="0x101C8000" />
+        <register type="NOA" address="0x00009888" value="0x1A1CE000" />
+        <register type="NOA" address="0x00009888" value="0x1C1C0030" />
+        <register type="NOA" address="0x00009888" value="0x004C8000" />
+        <register type="NOA" address="0x00009888" value="0x0A4C2A00" />
+        <register type="NOA" address="0x00009888" value="0x0C4C0280" />
+        <register type="NOA" address="0x00009888" value="0x000D2000" />
+        <register type="NOA" address="0x00009888" value="0x060D8000" />
+        <register type="NOA" address="0x00009888" value="0x080DA000" />
+        <register type="NOA" address="0x00009888" value="0x0E0DA000" />
+        <register type="NOA" address="0x00009888" value="0x0C0F0400" />
+        <register type="NOA" address="0x00009888" value="0x0E0F1500" />
+        <register type="NOA" address="0x00009888" value="0x100F0140" />
+        <register type="NOA" address="0x00009888" value="0x002C8000" />
+        <register type="NOA" address="0x00009888" value="0x0E2C8000" />
+        <register type="NOA" address="0x00009888" value="0x162C0A00" />
+        <register type="NOA" address="0x00009888" value="0x182C00A0" />
+        <register type="NOA" address="0x00009888" value="0x03933300" />
+        <register type="NOA" address="0x00009888" value="0x05930032" />
+        <register type="NOA" address="0x00009888" value="0x11930000" />
+        <register type="NOA" address="0x00009888" value="0x1B930000" />
+        <register type="NOA" address="0x00009888" value="0x1D900157" />
+        <register type="NOA" address="0x00009888" value="0x1F900158" />
+        <register type="NOA" address="0x00009888" value="0x35900000" />
+        <register type="NOA" address="0x00009888" value="0x19908000" />
+        <register type="NOA" address="0x00009888" value="0x1B908000" />
+        <register type="NOA" address="0x00009888" value="0x1190030F" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x41900000" />
+        <register type="NOA" address="0x00009888" value="0x55900000" />
+        <register type="NOA" address="0x00009888" value="0x45900021" />
+        <register type="NOA" address="0x00009888" value="0x47900000" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+        <register type="NOA" address="0x00009888" value="0x57900000" />
+        <register type="NOA" address="0x00009888" value="0x4B900000" />
+        <register type="NOA" address="0x00009888" value="0x59900000" />
+        <register type="NOA" address="0x00009888" value="0x53904444" />
+        <register type="NOA" address="0x00009888" value="0x43900000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x30800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x30800000" />
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002770" value="0x0007FFFA" />
+        <register type="OA" address="0x00002774" value="0x0000FEFE" />
+        <register type="OA" address="0x00002778" value="0x0007FFFA" />
+        <register type="OA" address="0x0000277C" value="0x0000FEFD" />
+        <register type="OA" address="0x00002790" value="0x0007FFFA" />
+        <register type="OA" address="0x00002794" value="0x0000FBEF" />
+        <register type="OA" address="0x00002798" value="0x0007FFFA" />
+        <register type="OA" address="0x0000279C" value="0x0000FBDF" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00000003" />
+        <register type="FLEX" address="0x0000E658" value="0x00002001" />
+        <register type="FLEX" address="0x0000E758" value="0x00101100" />
+        <register type="FLEX" address="0x0000E45C" value="0x00201200" />
+        <register type="FLEX" address="0x0000E55C" value="0x00301300" />
+        <register type="FLEX" address="0x0000E65C" value="0x00401400" />
+    </register_config>
+  </set>
+
+  <set name="Metric set HDCAndSF"
+       mdapi_supported_apis="VK OGL OCL IO BB"
+       underscore_name="hdc_and_sf"
+       hw_config_guid="c4bee67c-0de6-4bc2-9900-5388dcc8adca"
+       chipset="CFLGT3"
+       symbol_name="HDCAndSF"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SQ is full"
+             description="The percentage of time when SQ is filled above a threshold (usually 48 entries)"
+             data_type="float"
+             max_equation="100"
+             equation="PERFCNT1 READ_REG 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gt_request_queue_full"
+             units="percent"
+             symbol_name="GTRequestQueueFull"
+             availability="true $QueryMode &&"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL4 OCL"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on the both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="Polygon Data Ready"
+             description="The percentage of time in which geometry pipeline output is ready"
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="poly_data_ready"
+             units="percent"
+             symbol_name="PolyDataReady"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/3D Pipe/Strip-Fans"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="HDC stalled by L3 (s0.ss1)"
+             description="Percentage of time when HDC has messages to L3, but it's stalled due to lack of credits (s0.ss1)"
+             data_type="float"
+             max_equation="100"
+             equation="C 5 READ C 4 READ USUB 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="non_sampler_shader01_access_stalled_on_l3"
+             units="percent"
+             symbol_name="NonSamplerShader01AccessStalledOnL3"
+             availability="$SubsliceMask 0x2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="GPU/Data Port"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="HDC stalled by L3 (s0.ss2)"
+             description="Percentage of time when HDC has messages to L3, but it's stalled due to lack of credits (s0.ss2)"
+             data_type="float"
+             max_equation="100"
+             equation="C 3 READ C 2 READ USUB 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="non_sampler_shader02_access_stalled_on_l3"
+             units="percent"
+             symbol_name="NonSamplerShader02AccessStalledOnL3"
+             availability="$SubsliceMask 0x4 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="GPU/Data Port"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="HDC stalled by L3 (s0.ss0)"
+             description="Percentage of time when HDC has messages to L3, but it's stalled due to lack of credits (s0.ss0)"
+             data_type="float"
+             max_equation="100"
+             equation="C 7 READ C 6 READ USUB 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="non_sampler_shader00_access_stalled_on_l3"
+             units="percent"
+             symbol_name="NonSamplerShader00AccessStalledOnL3"
+             availability="$SubsliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="GPU/Data Port"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x000091BC" value="0xE0500000" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x104F0232" />
+        <register type="NOA" address="0x00009888" value="0x124F4640" />
+        <register type="NOA" address="0x00009888" value="0x106C0232" />
+        <register type="NOA" address="0x00009888" value="0x11834400" />
+        <register type="NOA" address="0x00009888" value="0x0A4E8000" />
+        <register type="NOA" address="0x00009888" value="0x0C4E8000" />
+        <register type="NOA" address="0x00009888" value="0x004F1880" />
+        <register type="NOA" address="0x00009888" value="0x024F08BB" />
+        <register type="NOA" address="0x00009888" value="0x044F001B" />
+        <register type="NOA" address="0x00009888" value="0x046C0100" />
+        <register type="NOA" address="0x00009888" value="0x066C000B" />
+        <register type="NOA" address="0x00009888" value="0x1A6C0000" />
+        <register type="NOA" address="0x00009888" value="0x041B8000" />
+        <register type="NOA" address="0x00009888" value="0x061B4000" />
+        <register type="NOA" address="0x00009888" value="0x1A1C1800" />
+        <register type="NOA" address="0x00009888" value="0x005B8000" />
+        <register type="NOA" address="0x00009888" value="0x025BC000" />
+        <register type="NOA" address="0x00009888" value="0x045B4000" />
+        <register type="NOA" address="0x00009888" value="0x125C8000" />
+        <register type="NOA" address="0x00009888" value="0x145C8000" />
+        <register type="NOA" address="0x00009888" value="0x165C8000" />
+        <register type="NOA" address="0x00009888" value="0x185C8000" />
+        <register type="NOA" address="0x00009888" value="0x0A4C00A0" />
+        <register type="NOA" address="0x00009888" value="0x000D8000" />
+        <register type="NOA" address="0x00009888" value="0x020DA000" />
+        <register type="NOA" address="0x00009888" value="0x040DA000" />
+        <register type="NOA" address="0x00009888" value="0x060D2000" />
+        <register type="NOA" address="0x00009888" value="0x0C0F5000" />
+        <register type="NOA" address="0x00009888" value="0x0E0F0055" />
+        <register type="NOA" address="0x00009888" value="0x022CC000" />
+        <register type="NOA" address="0x00009888" value="0x042CC000" />
+        <register type="NOA" address="0x00009888" value="0x062CC000" />
+        <register type="NOA" address="0x00009888" value="0x082CC000" />
+        <register type="NOA" address="0x00009888" value="0x0A2C8000" />
+        <register type="NOA" address="0x00009888" value="0x0C2C8000" />
+        <register type="NOA" address="0x00009888" value="0x0F828000" />
+        <register type="NOA" address="0x00009888" value="0x0F8305C0" />
+        <register type="NOA" address="0x00009888" value="0x09830000" />
+        <register type="NOA" address="0x00009888" value="0x07830000" />
+        <register type="NOA" address="0x00009888" value="0x1D950080" />
+        <register type="NOA" address="0x00009888" value="0x13928000" />
+        <register type="NOA" address="0x00009888" value="0x0F988000" />
+        <register type="NOA" address="0x00009888" value="0x31904000" />
+        <register type="NOA" address="0x00009888" value="0x1190FC00" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x59900000" />
+        <register type="NOA" address="0x00009888" value="0x4B900040" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x41900800" />
+        <register type="NOA" address="0x00009888" value="0x43900842" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+        <register type="NOA" address="0x00009888" value="0x45900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002744" value="0x00800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x10800000" />
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+        <register type="OA" address="0x00002770" value="0x00000002" />
+        <register type="OA" address="0x00002774" value="0x0000FDFF" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E758" value="0x00015014" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+        <register type="FLEX" address="0x0000E65C" value="0x00055054" />
+    </register_config>
+  </set>
+
+  <set name="Metric set L3_1"
+       mdapi_supported_apis="VK OGL OCL IO BB"
+       underscore_name="l3_1"
+       hw_config_guid="2f77a650-54a6-4777-98dc-e49000c13ceb"
+       chipset="CFLGT3"
+       symbol_name="L3_1"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 L3 Bank1 Active"
+             description="The percentage of time in which slice0 L3 bank1 is active"
+             data_type="float"
+             max_equation="100"
+             equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l30_bank1_active"
+             units="percent"
+             symbol_name="L30Bank1Active"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SQ is full"
+             description="The percentage of time when SQ is filled above a threshold (usually 48 entries)"
+             data_type="float"
+             max_equation="100"
+             equation="PERFCNT1 READ_REG 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gt_request_queue_full"
+             units="percent"
+             symbol_name="GTRequestQueueFull"
+             availability="true $QueryMode &&"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL4 OCL"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were actively processed on both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="Slice0 L3 Bank1 Stalled"
+             description="The percentage of time in which slice0 L3 bank1 is stalled"
+             data_type="float"
+             max_equation="100"
+             equation="B 4 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l30_bank1_stalled"
+             units="percent"
+             symbol_name="L30Bank1Stalled"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texel lookups (with 2x2 accuracy) that missed the L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 L3 Bank0 Active"
+             description="The percentage of time in which slice0 L3 bank0 is active"
+             data_type="float"
+             max_equation="100"
+             equation="C 6 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l30_bank0_active"
+             units="percent"
+             symbol_name="L30Bank0Active"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 L3 Bank0 Stalled"
+             description="The percentage of time in which slice0 L3 bank0 is stalled"
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l30_bank0_stalled"
+             units="percent"
+             symbol_name="L30Bank0Stalled"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x000091BC" value="0xE0500000" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x126C7B40" />
+        <register type="NOA" address="0x00009888" value="0x166C0020" />
+        <register type="NOA" address="0x00009888" value="0x0A603444" />
+        <register type="NOA" address="0x00009888" value="0x0A613400" />
+        <register type="NOA" address="0x00009888" value="0x1A4EA800" />
+        <register type="NOA" address="0x00009888" value="0x1C4E0002" />
+        <register type="NOA" address="0x00009888" value="0x024E8000" />
+        <register type="NOA" address="0x00009888" value="0x044E8000" />
+        <register type="NOA" address="0x00009888" value="0x064E8000" />
+        <register type="NOA" address="0x00009888" value="0x084E8000" />
+        <register type="NOA" address="0x00009888" value="0x0A4E8000" />
+        <register type="NOA" address="0x00009888" value="0x064F4000" />
+        <register type="NOA" address="0x00009888" value="0x0C6C5327" />
+        <register type="NOA" address="0x00009888" value="0x0E6C5425" />
+        <register type="NOA" address="0x00009888" value="0x006C2A00" />
+        <register type="NOA" address="0x00009888" value="0x026C285B" />
+        <register type="NOA" address="0x00009888" value="0x046C005C" />
+        <register type="NOA" address="0x00009888" value="0x106C0000" />
+        <register type="NOA" address="0x00009888" value="0x1C6C0000" />
+        <register type="NOA" address="0x00009888" value="0x1E6C0000" />
+        <register type="NOA" address="0x00009888" value="0x1A6C0800" />
+        <register type="NOA" address="0x00009888" value="0x0C1BC000" />
+        <register type="NOA" address="0x00009888" value="0x0E1BC000" />
+        <register type="NOA" address="0x00009888" value="0x001B8000" />
+        <register type="NOA" address="0x00009888" value="0x021BC000" />
+        <register type="NOA" address="0x00009888" value="0x041BC000" />
+        <register type="NOA" address="0x00009888" value="0x1C1C003C" />
+        <register type="NOA" address="0x00009888" value="0x121C8000" />
+        <register type="NOA" address="0x00009888" value="0x141C8000" />
+        <register type="NOA" address="0x00009888" value="0x161C8000" />
+        <register type="NOA" address="0x00009888" value="0x181C8000" />
+        <register type="NOA" address="0x00009888" value="0x1A1C0800" />
+        <register type="NOA" address="0x00009888" value="0x065B4000" />
+        <register type="NOA" address="0x00009888" value="0x1A5C1000" />
+        <register type="NOA" address="0x00009888" value="0x10600000" />
+        <register type="NOA" address="0x00009888" value="0x04600000" />
+        <register type="NOA" address="0x00009888" value="0x0C610044" />
+        <register type="NOA" address="0x00009888" value="0x10610000" />
+        <register type="NOA" address="0x00009888" value="0x06610000" />
+        <register type="NOA" address="0x00009888" value="0x0C4C02A8" />
+        <register type="NOA" address="0x00009888" value="0x084CA000" />
+        <register type="NOA" address="0x00009888" value="0x0A4C002A" />
+        <register type="NOA" address="0x00009888" value="0x0C0DA000" />
+        <register type="NOA" address="0x00009888" value="0x0E0DA000" />
+        <register type="NOA" address="0x00009888" value="0x000D8000" />
+        <register type="NOA" address="0x00009888" value="0x020DA000" />
+        <register type="NOA" address="0x00009888" value="0x040DA000" />
+        <register type="NOA" address="0x00009888" value="0x060D2000" />
+        <register type="NOA" address="0x00009888" value="0x100F0154" />
+        <register type="NOA" address="0x00009888" value="0x0C0F5000" />
+        <register type="NOA" address="0x00009888" value="0x0E0F0055" />
+        <register type="NOA" address="0x00009888" value="0x182C00AA" />
+        <register type="NOA" address="0x00009888" value="0x022C8000" />
+        <register type="NOA" address="0x00009888" value="0x042C8000" />
+        <register type="NOA" address="0x00009888" value="0x062C8000" />
+        <register type="NOA" address="0x00009888" value="0x082C8000" />
+        <register type="NOA" address="0x00009888" value="0x0A2C8000" />
+        <register type="NOA" address="0x00009888" value="0x0C2CC000" />
+        <register type="NOA" address="0x00009888" value="0x1190FFC0" />
+        <register type="NOA" address="0x00009888" value="0x57900000" />
+        <register type="NOA" address="0x00009888" value="0x49900420" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+        <register type="NOA" address="0x00009888" value="0x4B900021" />
+        <register type="NOA" address="0x00009888" value="0x59900000" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x41900400" />
+        <register type="NOA" address="0x00009888" value="0x43900421" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+        <register type="NOA" address="0x00009888" value="0x45900040" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002744" value="0x00800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0xF0800000" />
+        <register type="OA" address="0x00002770" value="0x00100070" />
+        <register type="OA" address="0x00002774" value="0x0000FFF1" />
+        <register type="OA" address="0x00002778" value="0x00014002" />
+        <register type="OA" address="0x0000277C" value="0x0000C3FF" />
+        <register type="OA" address="0x00002780" value="0x00010002" />
+        <register type="OA" address="0x00002784" value="0x0000C7FF" />
+        <register type="OA" address="0x00002788" value="0x00004002" />
+        <register type="OA" address="0x0000278C" value="0x0000D3FF" />
+        <register type="OA" address="0x00002790" value="0x00100700" />
+        <register type="OA" address="0x00002794" value="0x0000FF1F" />
+        <register type="OA" address="0x00002798" value="0x00001402" />
+        <register type="OA" address="0x0000279C" value="0x0000FC3F" />
+        <register type="OA" address="0x000027A0" value="0x00001002" />
+        <register type="OA" address="0x000027A4" value="0x0000FC7F" />
+        <register type="OA" address="0x000027A8" value="0x00000402" />
+        <register type="OA" address="0x000027AC" value="0x0000FD3F" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E758" value="0x00015014" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+        <register type="FLEX" address="0x0000E65C" value="0x00055054" />
+    </register_config>
+  </set>
+
+  <set name="Metric set L3_2"
+       mdapi_supported_apis="VK OGL OCL IO BB"
+       underscore_name="l3_2"
+       hw_config_guid="61cf6b31-9ddd-4deb-bae5-7339dd1f63b3"
+       chipset="CFLGT3"
+       symbol_name="L3_2"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SQ is full"
+             description="The percentage of time when SQ is filled above a threshold (usually 48 entries)"
+             data_type="float"
+             max_equation="100"
+             equation="PERFCNT1 READ_REG 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gt_request_queue_full"
+             units="percent"
+             symbol_name="GTRequestQueueFull"
+             availability="true $QueryMode &&"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL4 OCL"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on the both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 L3 Bank2 Stalled"
+             description="The percentage of time in which slice0 L3 bank2 is stalled"
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l30_bank2_stalled"
+             units="percent"
+             symbol_name="L30Bank2Stalled"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 L3 Bank2 Active"
+             description="The percentage of time in which slice0 L3 bank2 is active"
+             data_type="float"
+             max_equation="100"
+             equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l30_bank2_active"
+             units="percent"
+             symbol_name="L30Bank2Active"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x000091BC" value="0xE0500000" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x126C02E0" />
+        <register type="NOA" address="0x00009888" value="0x146C0001" />
+        <register type="NOA" address="0x00009888" value="0x0A623400" />
+        <register type="NOA" address="0x00009888" value="0x044E8000" />
+        <register type="NOA" address="0x00009888" value="0x064E8000" />
+        <register type="NOA" address="0x00009888" value="0x084E8000" />
+        <register type="NOA" address="0x00009888" value="0x0A4E8000" />
+        <register type="NOA" address="0x00009888" value="0x064F4000" />
+        <register type="NOA" address="0x00009888" value="0x026C3324" />
+        <register type="NOA" address="0x00009888" value="0x046C3422" />
+        <register type="NOA" address="0x00009888" value="0x106C0000" />
+        <register type="NOA" address="0x00009888" value="0x1A6C0000" />
+        <register type="NOA" address="0x00009888" value="0x021BC000" />
+        <register type="NOA" address="0x00009888" value="0x041BC000" />
+        <register type="NOA" address="0x00009888" value="0x141C8000" />
+        <register type="NOA" address="0x00009888" value="0x161C8000" />
+        <register type="NOA" address="0x00009888" value="0x181C8000" />
+        <register type="NOA" address="0x00009888" value="0x1A1C0800" />
+        <register type="NOA" address="0x00009888" value="0x065B4000" />
+        <register type="NOA" address="0x00009888" value="0x1A5C1000" />
+        <register type="NOA" address="0x00009888" value="0x06614000" />
+        <register type="NOA" address="0x00009888" value="0x0C620044" />
+        <register type="NOA" address="0x00009888" value="0x10620000" />
+        <register type="NOA" address="0x00009888" value="0x06620000" />
+        <register type="NOA" address="0x00009888" value="0x084C8000" />
+        <register type="NOA" address="0x00009888" value="0x0A4C002A" />
+        <register type="NOA" address="0x00009888" value="0x020DA000" />
+        <register type="NOA" address="0x00009888" value="0x040DA000" />
+        <register type="NOA" address="0x00009888" value="0x060D2000" />
+        <register type="NOA" address="0x00009888" value="0x0C0F4000" />
+        <register type="NOA" address="0x00009888" value="0x0E0F0055" />
+        <register type="NOA" address="0x00009888" value="0x042C8000" />
+        <register type="NOA" address="0x00009888" value="0x062C8000" />
+        <register type="NOA" address="0x00009888" value="0x082C8000" />
+        <register type="NOA" address="0x00009888" value="0x0A2C8000" />
+        <register type="NOA" address="0x00009888" value="0x0C2CC000" />
+        <register type="NOA" address="0x00009888" value="0x1190F800" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x43900000" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+        <register type="NOA" address="0x00009888" value="0x45900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002744" value="0x00800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+        <register type="OA" address="0x00002770" value="0x00100070" />
+        <register type="OA" address="0x00002774" value="0x0000FFF1" />
+        <register type="OA" address="0x00002778" value="0x00028002" />
+        <register type="OA" address="0x0000277C" value="0x000087FF" />
+        <register type="OA" address="0x00002780" value="0x00020002" />
+        <register type="OA" address="0x00002784" value="0x00008FFF" />
+        <register type="OA" address="0x00002788" value="0x00008002" />
+        <register type="OA" address="0x0000278C" value="0x0000A7FF" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E758" value="0x00015014" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+        <register type="FLEX" address="0x0000E65C" value="0x00055054" />
+    </register_config>
+  </set>
+
+  <set name="Metric set L3_3"
+       mdapi_supported_apis="VK OGL OCL IO BB"
+       underscore_name="l3_3"
+       hw_config_guid="1421ea8b-a4c9-4383-922a-60ba96c42f24"
+       chipset="CFLGT3"
+       symbol_name="L3_3"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SQ is full"
+             description="The percentage of time when SQ is filled above a threshold (usually 48 entries)"
+             data_type="float"
+             max_equation="100"
+             equation="PERFCNT1 READ_REG 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gt_request_queue_full"
+             units="percent"
+             symbol_name="GTRequestQueueFull"
+             availability="true $QueryMode &&"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL4 OCL"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on the both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Slice0 L3 Bank3 Stalled"
+             description="The percentage of time in which slice0 L3 bank3 is stalled"
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l30_bank3_stalled"
+             units="percent"
+             symbol_name="L30Bank3Stalled"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 L3 Bank3 Active"
+             description="The percentage of time in which slice0 L3 bank3 is active"
+             data_type="float"
+             max_equation="100"
+             equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l30_bank3_active"
+             units="percent"
+             symbol_name="L30Bank3Active"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x000091BC" value="0xE0500000" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x126C4E80" />
+        <register type="NOA" address="0x00009888" value="0x146C0000" />
+        <register type="NOA" address="0x00009888" value="0x0A633400" />
+        <register type="NOA" address="0x00009888" value="0x044E8000" />
+        <register type="NOA" address="0x00009888" value="0x064E8000" />
+        <register type="NOA" address="0x00009888" value="0x084E8000" />
+        <register type="NOA" address="0x00009888" value="0x0A4E8000" />
+        <register type="NOA" address="0x00009888" value="0x0C4E8000" />
+        <register type="NOA" address="0x00009888" value="0x026C3321" />
+        <register type="NOA" address="0x00009888" value="0x046C342F" />
+        <register type="NOA" address="0x00009888" value="0x106C0000" />
+        <register type="NOA" address="0x00009888" value="0x1A6C2000" />
+        <register type="NOA" address="0x00009888" value="0x021BC000" />
+        <register type="NOA" address="0x00009888" value="0x041BC000" />
+        <register type="NOA" address="0x00009888" value="0x061B4000" />
+        <register type="NOA" address="0x00009888" value="0x141C8000" />
+        <register type="NOA" address="0x00009888" value="0x161C8000" />
+        <register type="NOA" address="0x00009888" value="0x181C8000" />
+        <register type="NOA" address="0x00009888" value="0x1A1C1800" />
+        <register type="NOA" address="0x00009888" value="0x06604000" />
+        <register type="NOA" address="0x00009888" value="0x0C630044" />
+        <register type="NOA" address="0x00009888" value="0x10630000" />
+        <register type="NOA" address="0x00009888" value="0x06630000" />
+        <register type="NOA" address="0x00009888" value="0x084C8000" />
+        <register type="NOA" address="0x00009888" value="0x0A4C00AA" />
+        <register type="NOA" address="0x00009888" value="0x020DA000" />
+        <register type="NOA" address="0x00009888" value="0x040DA000" />
+        <register type="NOA" address="0x00009888" value="0x060D2000" />
+        <register type="NOA" address="0x00009888" value="0x0C0F4000" />
+        <register type="NOA" address="0x00009888" value="0x0E0F0055" />
+        <register type="NOA" address="0x00009888" value="0x042C8000" />
+        <register type="NOA" address="0x00009888" value="0x062C8000" />
+        <register type="NOA" address="0x00009888" value="0x082C8000" />
+        <register type="NOA" address="0x00009888" value="0x0A2C8000" />
+        <register type="NOA" address="0x00009888" value="0x0C2C8000" />
+        <register type="NOA" address="0x00009888" value="0x1190F800" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x43900842" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+        <register type="NOA" address="0x00009888" value="0x45900002" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002744" value="0x00800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+        <register type="OA" address="0x00002770" value="0x00100070" />
+        <register type="OA" address="0x00002774" value="0x0000FFF1" />
+        <register type="OA" address="0x00002778" value="0x00028002" />
+        <register type="OA" address="0x0000277C" value="0x000087FF" />
+        <register type="OA" address="0x00002780" value="0x00020002" />
+        <register type="OA" address="0x00002784" value="0x00008FFF" />
+        <register type="OA" address="0x00002788" value="0x00008002" />
+        <register type="OA" address="0x0000278C" value="0x0000A7FF" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E758" value="0x00015014" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+        <register type="FLEX" address="0x0000E65C" value="0x00055054" />
+    </register_config>
+  </set>
+
+  <set name="Metric set RasterizerAndPixelBackend"
+       mdapi_supported_apis="VK OGL OCL IO BB"
+       underscore_name="rasterizer_and_pixel_backend"
+       hw_config_guid="6e1f0a90-c65f-4da9-86d0-c79b3c0063f6"
+       chipset="CFLGT3"
+       symbol_name="RasterizerAndPixelBackend"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SQ is full"
+             description="The percentage of time when SQ is filled above a threshold (usually 48 entries)"
+             data_type="float"
+             max_equation="100"
+             equation="PERFCNT1 READ_REG 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gt_request_queue_full"
+             units="percent"
+             symbol_name="GTRequestQueueFull"
+             availability="true $QueryMode &&"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL4 OCL"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on the both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Slice0 Pixel Values Ready"
+             description="The percentage of time in which slice0 pixel values are ready"
+             data_type="float"
+             max_equation="100"
+             equation="C 6 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="pixel_values0_ready"
+             units="percent"
+             symbol_name="PixelValues0Ready"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/3D Pipe"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="Slice0 Rasterizer Input Available"
+             description="The percentage of time in which slice0 rasterizer input is available"
+             data_type="float"
+             max_equation="100"
+             equation="B 1 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="rasterizer0_input_available"
+             units="percent"
+             symbol_name="Rasterizer0InputAvailable"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Rasterizer"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Slice0 Post-EarlyZ Pixel Data Ready"
+             description="The percentage of time in which slice0 post-EarlyZ pixel data is ready (after early Z tests have been applied)"
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="pixel_data0_ready"
+             units="percent"
+             symbol_name="PixelData0Ready"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Rasterizer/Early Depth Test"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 Rasterizer Output Ready"
+             description="The percentage of time in which slice0 rasterizer output is ready"
+             data_type="float"
+             max_equation="100"
+             equation="C 5 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="rasterizer0_output_ready"
+             units="percent"
+             symbol_name="Rasterizer0OutputReady"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Rasterizer"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="Slice0 PS Output Available"
+             description="The percentage of time in which slice0 PS output is available"
+             data_type="float"
+             max_equation="100"
+             equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_output0_available"
+             units="percent"
+             symbol_name="PSOutput0Available"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/3D Pipe"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x000091BC" value="0xE0500000" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x102F3800" />
+        <register type="NOA" address="0x00009888" value="0x144D0500" />
+        <register type="NOA" address="0x00009888" value="0x120D03C0" />
+        <register type="NOA" address="0x00009888" value="0x140D03CF" />
+        <register type="NOA" address="0x00009888" value="0x0C0F0004" />
+        <register type="NOA" address="0x00009888" value="0x0C4E4000" />
+        <register type="NOA" address="0x00009888" value="0x042F0480" />
+        <register type="NOA" address="0x00009888" value="0x082F0000" />
+        <register type="NOA" address="0x00009888" value="0x022F0000" />
+        <register type="NOA" address="0x00009888" value="0x0A4C0090" />
+        <register type="NOA" address="0x00009888" value="0x064D0027" />
+        <register type="NOA" address="0x00009888" value="0x004D0000" />
+        <register type="NOA" address="0x00009888" value="0x000D0D40" />
+        <register type="NOA" address="0x00009888" value="0x020D803F" />
+        <register type="NOA" address="0x00009888" value="0x040D8023" />
+        <register type="NOA" address="0x00009888" value="0x100D0000" />
+        <register type="NOA" address="0x00009888" value="0x060D2000" />
+        <register type="NOA" address="0x00009888" value="0x020F0010" />
+        <register type="NOA" address="0x00009888" value="0x000F0000" />
+        <register type="NOA" address="0x00009888" value="0x0E0F0050" />
+        <register type="NOA" address="0x00009888" value="0x0A2C8000" />
+        <register type="NOA" address="0x00009888" value="0x0C2C8000" />
+        <register type="NOA" address="0x00009888" value="0x1190FC00" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x41901400" />
+        <register type="NOA" address="0x00009888" value="0x43901485" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+        <register type="NOA" address="0x00009888" value="0x45900001" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002744" value="0x00800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x30800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+        <register type="OA" address="0x00002770" value="0x00000002" />
+        <register type="OA" address="0x00002774" value="0x0000EFFF" />
+        <register type="OA" address="0x00002778" value="0x00006000" />
+        <register type="OA" address="0x0000277C" value="0x0000F3FF" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E758" value="0x00015014" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+        <register type="FLEX" address="0x0000E65C" value="0x00055054" />
+    </register_config>
+  </set>
+
+  <set name="Metric set Sampler"
+       mdapi_supported_apis="VK OGL OCL IO BB"
+       underscore_name="sampler"
+       hw_config_guid="7cb05eab-0857-4189-93bc-09326d298637"
+       chipset="CFLGT3"
+       symbol_name="Sampler"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 Subslice2 Input Available"
+             description="The percentage of time in which slice0 subslice2 sampler input is available"
+             data_type="float"
+             max_equation="100"
+             equation="B 1 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler02_input_available"
+             units="percent"
+             symbol_name="Sampler02InputAvailable"
+             availability="$SubsliceMask 0x4 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SQ is full"
+             description="The percentage of time when SQ is filled above a threshold (usually 48 entries)"
+             data_type="float"
+             max_equation="100"
+             equation="PERFCNT1 READ_REG 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gt_request_queue_full"
+             units="percent"
+             symbol_name="GTRequestQueueFull"
+             availability="true $QueryMode &&"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL4 OCL"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 Subslice0 Input Available"
+             description="The percentage of time in which slice0 subslice0 sampler input is available"
+             data_type="float"
+             max_equation="100"
+             equation="B 2 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler00_input_available"
+             units="percent"
+             symbol_name="Sampler00InputAvailable"
+             availability="$SubsliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="Slice0 Subslice2 Sampler Output Ready"
+             description="The percentage of time in which slice0 subslice2 sampler output is ready"
+             data_type="float"
+             max_equation="100"
+             equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler02_output_ready"
+             units="percent"
+             symbol_name="Sampler02OutputReady"
+             availability="$SubsliceMask 0x4 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Slice0 Subslice1 Input Available"
+             description="The percentage of time in which slice0 subslice1 sampler input is available"
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler01_input_available"
+             units="percent"
+             symbol_name="Sampler01InputAvailable"
+             availability="$SubsliceMask 0x2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texel lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Slice0 Subslice0 Sampler Output Ready"
+             description="The percentage of time in which slice0 subslice0 sampler output is ready"
+             data_type="float"
+             max_equation="100"
+             equation="C 6 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler00_output_ready"
+             units="percent"
+             symbol_name="Sampler00OutputReady"
+             availability="$SubsliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Slice0 Subslice1 Sampler Output Ready"
+             description="The percentage of time in which slice0 subslice1 sampler output is ready"
+             data_type="float"
+             max_equation="100"
+             equation="C 5 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler01_output_ready"
+             units="percent"
+             symbol_name="Sampler01OutputReady"
+             availability="$SubsliceMask 0x2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x000091BC" value="0xE0500000" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x14152C00" />
+        <register type="NOA" address="0x00009888" value="0x16150005" />
+        <register type="NOA" address="0x00009888" value="0x121600A0" />
+        <register type="NOA" address="0x00009888" value="0x14352C00" />
+        <register type="NOA" address="0x00009888" value="0x16350005" />
+        <register type="NOA" address="0x00009888" value="0x123600A0" />
+        <register type="NOA" address="0x00009888" value="0x14552C00" />
+        <register type="NOA" address="0x00009888" value="0x16550005" />
+        <register type="NOA" address="0x00009888" value="0x125600A0" />
+        <register type="NOA" address="0x00009888" value="0x062F6000" />
+        <register type="NOA" address="0x00009888" value="0x022F2000" />
+        <register type="NOA" address="0x00009888" value="0x0C4C0050" />
+        <register type="NOA" address="0x00009888" value="0x0A4C0010" />
+        <register type="NOA" address="0x00009888" value="0x0C0D8000" />
+        <register type="NOA" address="0x00009888" value="0x0E0DA000" />
+        <register type="NOA" address="0x00009888" value="0x000D8000" />
+        <register type="NOA" address="0x00009888" value="0x020DA000" />
+        <register type="NOA" address="0x00009888" value="0x040DA000" />
+        <register type="NOA" address="0x00009888" value="0x060D2000" />
+        <register type="NOA" address="0x00009888" value="0x100F0350" />
+        <register type="NOA" address="0x00009888" value="0x0C0FB000" />
+        <register type="NOA" address="0x00009888" value="0x0E0F00DA" />
+        <register type="NOA" address="0x00009888" value="0x182C0028" />
+        <register type="NOA" address="0x00009888" value="0x0A2C8000" />
+        <register type="NOA" address="0x00009888" value="0x022DC000" />
+        <register type="NOA" address="0x00009888" value="0x042D4000" />
+        <register type="NOA" address="0x00009888" value="0x0C138000" />
+        <register type="NOA" address="0x00009888" value="0x0E132000" />
+        <register type="NOA" address="0x00009888" value="0x0413C000" />
+        <register type="NOA" address="0x00009888" value="0x1C140018" />
+        <register type="NOA" address="0x00009888" value="0x0C157000" />
+        <register type="NOA" address="0x00009888" value="0x0E150078" />
+        <register type="NOA" address="0x00009888" value="0x10150000" />
+        <register type="NOA" address="0x00009888" value="0x04162180" />
+        <register type="NOA" address="0x00009888" value="0x02160000" />
+        <register type="NOA" address="0x00009888" value="0x04174000" />
+        <register type="NOA" address="0x00009888" value="0x0233A000" />
+        <register type="NOA" address="0x00009888" value="0x04333000" />
+        <register type="NOA" address="0x00009888" value="0x14348000" />
+        <register type="NOA" address="0x00009888" value="0x16348000" />
+        <register type="NOA" address="0x00009888" value="0x02357870" />
+        <register type="NOA" address="0x00009888" value="0x10350000" />
+        <register type="NOA" address="0x00009888" value="0x04360043" />
+        <register type="NOA" address="0x00009888" value="0x02360000" />
+        <register type="NOA" address="0x00009888" value="0x04371000" />
+        <register type="NOA" address="0x00009888" value="0x0E538000" />
+        <register type="NOA" address="0x00009888" value="0x00538000" />
+        <register type="NOA" address="0x00009888" value="0x06533000" />
+        <register type="NOA" address="0x00009888" value="0x1C540020" />
+        <register type="NOA" address="0x00009888" value="0x12548000" />
+        <register type="NOA" address="0x00009888" value="0x0E557000" />
+        <register type="NOA" address="0x00009888" value="0x00557800" />
+        <register type="NOA" address="0x00009888" value="0x10550000" />
+        <register type="NOA" address="0x00009888" value="0x06560043" />
+        <register type="NOA" address="0x00009888" value="0x02560000" />
+        <register type="NOA" address="0x00009888" value="0x06571000" />
+        <register type="NOA" address="0x00009888" value="0x1190FF80" />
+        <register type="NOA" address="0x00009888" value="0x57900000" />
+        <register type="NOA" address="0x00009888" value="0x49900000" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+        <register type="NOA" address="0x00009888" value="0x4B900060" />
+        <register type="NOA" address="0x00009888" value="0x59900000" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x41900C00" />
+        <register type="NOA" address="0x00009888" value="0x43900842" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+        <register type="NOA" address="0x00009888" value="0x45900060" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002744" value="0x00800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x70800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+        <register type="OA" address="0x00002770" value="0x0000C000" />
+        <register type="OA" address="0x00002774" value="0x0000E7FF" />
+        <register type="OA" address="0x00002778" value="0x00003000" />
+        <register type="OA" address="0x0000277C" value="0x0000F9FF" />
+        <register type="OA" address="0x00002780" value="0x00000C00" />
+        <register type="OA" address="0x00002784" value="0x0000FE7F" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E758" value="0x00015014" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+        <register type="FLEX" address="0x0000E65C" value="0x00055054" />
+    </register_config>
+  </set>
+
+  <set name="Metric set TDL_1"
+       mdapi_supported_apis="VK OGL OCL IO BB"
+       underscore_name="tdl_1"
+       hw_config_guid="05a06d02-0c12-486b-bb1d-9be053848980"
+       chipset="CFLGT3"
+       symbol_name="TDL_1"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SQ is full"
+             description="The percentage of time when SQ is filled above a threshold (usually 48 entries)"
+             data_type="float"
+             max_equation="100"
+             equation="PERFCNT1 READ_REG 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gt_request_queue_full"
+             units="percent"
+             symbol_name="GTRequestQueueFull"
+             availability="true $QueryMode &&"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL4 OCL"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on the both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="NonPS Thread Ready For Dispatch on Slice0 Subslice2"
+             description="The percentage of time in which non-PS thread is ready for dispatch on slice0 subslice2 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="B 4 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="non_ps_thread02_ready_for_dispatch"
+             units="percent"
+             symbol_name="NonPSThread02ReadyForDispatch"
+             availability="$SubsliceMask 0x4 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="NonPS Thread Ready For Dispatch on Slice0 Subslice0"
+             description="The percentage of time in which non-PS thread is ready for dispatch on slice0 subslice0 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="B 2 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="non_ps_thread00_ready_for_dispatch"
+             units="percent"
+             symbol_name="NonPSThread00ReadyForDispatch"
+             availability="$SubsliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Thread Ready For Dispatch on Slice0 Subslice0"
+             description="The percentage of time in which PS thread is ready for dispatch on slice0 subslice0 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="B 1 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_thread00_ready_for_dispatch"
+             units="percent"
+             symbol_name="PSThread00ReadyForDispatch"
+             availability="$SubsliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="PS Thread Ready For Dispatch on Slice0 Subslice1"
+             description="The percentage of time in which PS thread is ready for dispatch on slice0 subslice1 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="B 5 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_thread01_ready_for_dispatch"
+             units="percent"
+             symbol_name="PSThread01ReadyForDispatch"
+             availability="$SubsliceMask 0x2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="PS Thread Ready For Dispatch on Slice0 Subslice2"
+             description="The percentage of time in which PS thread is ready for dispatch on slice0 subslice2 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="B 3 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_thread02_ready_for_dispatch"
+             units="percent"
+             symbol_name="PSThread02ReadyForDispatch"
+             availability="$SubsliceMask 0x4 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <counter name="NonPS Thread Ready For Dispatch on Slice0 Subslice1"
+             description="The percentage of time in which non-PS thread is ready for dispatch on slice0 subslice1 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="non_ps_thread01_ready_for_dispatch"
+             units="percent"
+             symbol_name="NonPSThread01ReadyForDispatch"
+             availability="$SubsliceMask 0x2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x000091BC" value="0xE0500000" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x12120000" />
+        <register type="NOA" address="0x00009888" value="0x12320000" />
+        <register type="NOA" address="0x00009888" value="0x12520000" />
+        <register type="NOA" address="0x00009888" value="0x002F8000" />
+        <register type="NOA" address="0x00009888" value="0x022F3000" />
+        <register type="NOA" address="0x00009888" value="0x0A4C0015" />
+        <register type="NOA" address="0x00009888" value="0x0C0D8000" />
+        <register type="NOA" address="0x00009888" value="0x0E0DA000" />
+        <register type="NOA" address="0x00009888" value="0x000D8000" />
+        <register type="NOA" address="0x00009888" value="0x020DA000" />
+        <register type="NOA" address="0x00009888" value="0x040DA000" />
+        <register type="NOA" address="0x00009888" value="0x060D2000" />
+        <register type="NOA" address="0x00009888" value="0x100F03A0" />
+        <register type="NOA" address="0x00009888" value="0x0C0FF000" />
+        <register type="NOA" address="0x00009888" value="0x0E0F0095" />
+        <register type="NOA" address="0x00009888" value="0x062C8000" />
+        <register type="NOA" address="0x00009888" value="0x082C8000" />
+        <register type="NOA" address="0x00009888" value="0x0A2C8000" />
+        <register type="NOA" address="0x00009888" value="0x0C2D8000" />
+        <register type="NOA" address="0x00009888" value="0x0E2D4000" />
+        <register type="NOA" address="0x00009888" value="0x062D4000" />
+        <register type="NOA" address="0x00009888" value="0x02108000" />
+        <register type="NOA" address="0x00009888" value="0x0410C000" />
+        <register type="NOA" address="0x00009888" value="0x02118000" />
+        <register type="NOA" address="0x00009888" value="0x0411C000" />
+        <register type="NOA" address="0x00009888" value="0x02121880" />
+        <register type="NOA" address="0x00009888" value="0x041219B5" />
+        <register type="NOA" address="0x00009888" value="0x00120000" />
+        <register type="NOA" address="0x00009888" value="0x02134000" />
+        <register type="NOA" address="0x00009888" value="0x04135000" />
+        <register type="NOA" address="0x00009888" value="0x0C308000" />
+        <register type="NOA" address="0x00009888" value="0x0E304000" />
+        <register type="NOA" address="0x00009888" value="0x06304000" />
+        <register type="NOA" address="0x00009888" value="0x0C318000" />
+        <register type="NOA" address="0x00009888" value="0x0E314000" />
+        <register type="NOA" address="0x00009888" value="0x06314000" />
+        <register type="NOA" address="0x00009888" value="0x0C321A80" />
+        <register type="NOA" address="0x00009888" value="0x0E320033" />
+        <register type="NOA" address="0x00009888" value="0x06320031" />
+        <register type="NOA" address="0x00009888" value="0x00320000" />
+        <register type="NOA" address="0x00009888" value="0x0C334000" />
+        <register type="NOA" address="0x00009888" value="0x0E331000" />
+        <register type="NOA" address="0x00009888" value="0x06331000" />
+        <register type="NOA" address="0x00009888" value="0x0E508000" />
+        <register type="NOA" address="0x00009888" value="0x00508000" />
+        <register type="NOA" address="0x00009888" value="0x02504000" />
+        <register type="NOA" address="0x00009888" value="0x0E518000" />
+        <register type="NOA" address="0x00009888" value="0x00518000" />
+        <register type="NOA" address="0x00009888" value="0x02514000" />
+        <register type="NOA" address="0x00009888" value="0x0E521880" />
+        <register type="NOA" address="0x00009888" value="0x00521A80" />
+        <register type="NOA" address="0x00009888" value="0x02520033" />
+        <register type="NOA" address="0x00009888" value="0x0E534000" />
+        <register type="NOA" address="0x00009888" value="0x00534000" />
+        <register type="NOA" address="0x00009888" value="0x02531000" />
+        <register type="NOA" address="0x00009888" value="0x1190FF80" />
+        <register type="NOA" address="0x00009888" value="0x57900000" />
+        <register type="NOA" address="0x00009888" value="0x49900800" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+        <register type="NOA" address="0x00009888" value="0x4B900062" />
+        <register type="NOA" address="0x00009888" value="0x59900000" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x41900C00" />
+        <register type="NOA" address="0x00009888" value="0x43900003" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+        <register type="NOA" address="0x00009888" value="0x45900040" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002744" value="0x00800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x30800000" />
+        <register type="OA" address="0x00002770" value="0x00000002" />
+        <register type="OA" address="0x00002774" value="0x00007FFF" />
+        <register type="OA" address="0x00002778" value="0x00000000" />
+        <register type="OA" address="0x0000277C" value="0x00009FFF" />
+        <register type="OA" address="0x00002780" value="0x00000002" />
+        <register type="OA" address="0x00002784" value="0x0000EFFF" />
+        <register type="OA" address="0x00002788" value="0x00000000" />
+        <register type="OA" address="0x0000278C" value="0x0000F3FF" />
+        <register type="OA" address="0x00002790" value="0x00000002" />
+        <register type="OA" address="0x00002794" value="0x0000FDFF" />
+        <register type="OA" address="0x00002798" value="0x00000000" />
+        <register type="OA" address="0x0000279C" value="0x0000FE7F" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E758" value="0x00015014" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+        <register type="FLEX" address="0x0000E65C" value="0x00055054" />
+    </register_config>
+  </set>
+
+  <set name="Metric set TDL_2"
+       mdapi_supported_apis="VK OGL OCL IO BB"
+       underscore_name="tdl_2"
+       hw_config_guid="cddbd1dc-41a2-4fe4-8b05-3d2773120814"
+       chipset="CFLGT3"
+       symbol_name="TDL_2"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SQ is full"
+             description="The percentage of time when SQ is filled above a threshold (usually 48 entries)"
+             data_type="float"
+             max_equation="100"
+             equation="PERFCNT1 READ_REG 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gt_request_queue_full"
+             units="percent"
+             symbol_name="GTRequestQueueFull"
+             availability="true $QueryMode &&"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL4 OCL"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on the both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Thread Header Ready on Slice0 Subslice1 Port 0"
+             description="The percentage of time in which thread header is ready on slice0 subslice1 thread dispatcher port 0"
+             data_type="float"
+             max_equation="100"
+             equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header01_ready_port0"
+             units="percent"
+             symbol_name="ThreadHeader01ReadyPort0"
+             availability="$SubsliceMask 0x2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Thread Header Ready on Slice0 Subslice1 Port 1"
+             description="The percentage of time in which thread header is ready on slice0 subslice1 thread dispatcher port 1"
+             data_type="float"
+             max_equation="100"
+             equation="C 2 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header01_ready_port1"
+             units="percent"
+             symbol_name="ThreadHeader01ReadyPort1"
+             availability="$SubsliceMask 0x2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Thread Header Ready on Slice0 Subslice2 Port 1"
+             description="The percentage of time in which thread header is ready on slice0 subslice2 thread dispatcher port 1"
+             data_type="float"
+             max_equation="100"
+             equation="C 4 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header02_ready_port1"
+             units="percent"
+             symbol_name="ThreadHeader02ReadyPort1"
+             availability="$SubsliceMask 0x4 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Thread Header Ready on Slice0 Subslice2 Port 0"
+             description="The percentage of time in which thread header is ready on slice0 subslice2 thread dispatcher port 0"
+             data_type="float"
+             max_equation="100"
+             equation="C 3 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header02_ready_port0"
+             units="percent"
+             symbol_name="ThreadHeader02ReadyPort0"
+             availability="$SubsliceMask 0x4 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="Thread Header Ready on Slice0 Subslice0 Port 0"
+             description="The percentage of time in which thread header is ready on slice0 subslice0 thread dispatcher port 0"
+             data_type="float"
+             max_equation="100"
+             equation="C 5 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header00_ready_port0"
+             units="percent"
+             symbol_name="ThreadHeader00ReadyPort0"
+             availability="$SubsliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <counter name="Thread Header Ready on Slice0 Subslice0 Port 1"
+             description="The percentage of time in which thread header is ready on slice0 subslice0 thread dispatcher port 1"
+             data_type="float"
+             max_equation="100"
+             equation="C 6 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header00_ready_port1"
+             units="percent"
+             symbol_name="ThreadHeader00ReadyPort1"
+             availability="$SubsliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x000091BC" value="0xE0500000" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x12124D60" />
+        <register type="NOA" address="0x00009888" value="0x12322E60" />
+        <register type="NOA" address="0x00009888" value="0x12524D60" />
+        <register type="NOA" address="0x00009888" value="0x022F3000" />
+        <register type="NOA" address="0x00009888" value="0x0A4C0014" />
+        <register type="NOA" address="0x00009888" value="0x000D8000" />
+        <register type="NOA" address="0x00009888" value="0x020DA000" />
+        <register type="NOA" address="0x00009888" value="0x040DA000" />
+        <register type="NOA" address="0x00009888" value="0x060D2000" />
+        <register type="NOA" address="0x00009888" value="0x0C0FE000" />
+        <register type="NOA" address="0x00009888" value="0x0E0F0097" />
+        <register type="NOA" address="0x00009888" value="0x082C8000" />
+        <register type="NOA" address="0x00009888" value="0x0A2C8000" />
+        <register type="NOA" address="0x00009888" value="0x002D8000" />
+        <register type="NOA" address="0x00009888" value="0x062D4000" />
+        <register type="NOA" address="0x00009888" value="0x0410C000" />
+        <register type="NOA" address="0x00009888" value="0x0411C000" />
+        <register type="NOA" address="0x00009888" value="0x04121FB7" />
+        <register type="NOA" address="0x00009888" value="0x00120000" />
+        <register type="NOA" address="0x00009888" value="0x04135000" />
+        <register type="NOA" address="0x00009888" value="0x00308000" />
+        <register type="NOA" address="0x00009888" value="0x06304000" />
+        <register type="NOA" address="0x00009888" value="0x00318000" />
+        <register type="NOA" address="0x00009888" value="0x06314000" />
+        <register type="NOA" address="0x00009888" value="0x00321B80" />
+        <register type="NOA" address="0x00009888" value="0x0632003F" />
+        <register type="NOA" address="0x00009888" value="0x00334000" />
+        <register type="NOA" address="0x00009888" value="0x06331000" />
+        <register type="NOA" address="0x00009888" value="0x0250C000" />
+        <register type="NOA" address="0x00009888" value="0x0251C000" />
+        <register type="NOA" address="0x00009888" value="0x02521FB7" />
+        <register type="NOA" address="0x00009888" value="0x00520000" />
+        <register type="NOA" address="0x00009888" value="0x02535000" />
+        <register type="NOA" address="0x00009888" value="0x1190FC00" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x41900800" />
+        <register type="NOA" address="0x00009888" value="0x43900063" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+        <register type="NOA" address="0x00009888" value="0x45900040" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002744" value="0x00800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x00800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E758" value="0x00015014" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+        <register type="FLEX" address="0x0000E65C" value="0x00055054" />
+    </register_config>
+  </set>
+
+  <set name="Compute Metrics Extra Gen9"
+       mdapi_supported_apis="VK OGL4 OCL IO BB"
+       underscore_name="compute_extra"
+       hw_config_guid="e61ae394-9d9e-4204-a735-1dad7e44d953"
+       chipset="CFLGT3"
+       symbol_name="ComputeExtra"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="fpu1_active"
+             units="percent"
+             symbol_name="Fpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU1 Pipe Active including Ext Math"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing including Extended Math processing"
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ  C 5 READ C 6 READ FADD C 7 READ FADD C 2 READ FADD C 3 READ FADD C 4 READ FADD 8 FMUL FADD 100 FMUL $EuCoresTotalCount FDIV $GpuCoreClocks FDIV"
+             underscore_name="fpu1_active_adjusted"
+             units="percent"
+             symbol_name="Fpu1ActiveAdjusted"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x121203E0" />
+        <register type="NOA" address="0x00009888" value="0x123203E0" />
+        <register type="NOA" address="0x00009888" value="0x125203E0" />
+        <register type="NOA" address="0x00009888" value="0x129203E0" />
+        <register type="NOA" address="0x00009888" value="0x12B203E0" />
+        <register type="NOA" address="0x00009888" value="0x12D203E0" />
+        <register type="NOA" address="0x00009888" value="0x024EC000" />
+        <register type="NOA" address="0x00009888" value="0x044EC000" />
+        <register type="NOA" address="0x00009888" value="0x064EC000" />
+        <register type="NOA" address="0x00009888" value="0x022F4000" />
+        <register type="NOA" address="0x00009888" value="0x084CA000" />
+        <register type="NOA" address="0x00009888" value="0x0A4C0042" />
+        <register type="NOA" address="0x00009888" value="0x000D8000" />
+        <register type="NOA" address="0x00009888" value="0x020DA000" />
+        <register type="NOA" address="0x00009888" value="0x040DA000" />
+        <register type="NOA" address="0x00009888" value="0x060D2000" />
+        <register type="NOA" address="0x00009888" value="0x0C0F5000" />
+        <register type="NOA" address="0x00009888" value="0x0E0F006D" />
+        <register type="NOA" address="0x00009888" value="0x022C8000" />
+        <register type="NOA" address="0x00009888" value="0x042C8000" />
+        <register type="NOA" address="0x00009888" value="0x062C8000" />
+        <register type="NOA" address="0x00009888" value="0x0C2C8000" />
+        <register type="NOA" address="0x00009888" value="0x042D8000" />
+        <register type="NOA" address="0x00009888" value="0x06104000" />
+        <register type="NOA" address="0x00009888" value="0x06114000" />
+        <register type="NOA" address="0x00009888" value="0x06120033" />
+        <register type="NOA" address="0x00009888" value="0x00120000" />
+        <register type="NOA" address="0x00009888" value="0x06131000" />
+        <register type="NOA" address="0x00009888" value="0x04308000" />
+        <register type="NOA" address="0x00009888" value="0x04318000" />
+        <register type="NOA" address="0x00009888" value="0x04321980" />
+        <register type="NOA" address="0x00009888" value="0x00320000" />
+        <register type="NOA" address="0x00009888" value="0x04334000" />
+        <register type="NOA" address="0x00009888" value="0x04504000" />
+        <register type="NOA" address="0x00009888" value="0x04514000" />
+        <register type="NOA" address="0x00009888" value="0x04520033" />
+        <register type="NOA" address="0x00009888" value="0x00520000" />
+        <register type="NOA" address="0x00009888" value="0x04531000" />
+        <register type="NOA" address="0x00009888" value="0x00AF8000" />
+        <register type="NOA" address="0x00009888" value="0x0ACC0001" />
+        <register type="NOA" address="0x00009888" value="0x008D8000" />
+        <register type="NOA" address="0x00009888" value="0x028DA000" />
+        <register type="NOA" address="0x00009888" value="0x0C8FB000" />
+        <register type="NOA" address="0x00009888" value="0x0E8F0001" />
+        <register type="NOA" address="0x00009888" value="0x06AC8000" />
+        <register type="NOA" address="0x00009888" value="0x02AD4000" />
+        <register type="NOA" address="0x00009888" value="0x02908000" />
+        <register type="NOA" address="0x00009888" value="0x02918000" />
+        <register type="NOA" address="0x00009888" value="0x02921980" />
+        <register type="NOA" address="0x00009888" value="0x00920000" />
+        <register type="NOA" address="0x00009888" value="0x02934000" />
+        <register type="NOA" address="0x00009888" value="0x02B04000" />
+        <register type="NOA" address="0x00009888" value="0x02B14000" />
+        <register type="NOA" address="0x00009888" value="0x02B20033" />
+        <register type="NOA" address="0x00009888" value="0x00B20000" />
+        <register type="NOA" address="0x00009888" value="0x02B31000" />
+        <register type="NOA" address="0x00009888" value="0x00D08000" />
+        <register type="NOA" address="0x00009888" value="0x00D18000" />
+        <register type="NOA" address="0x00009888" value="0x00D21980" />
+        <register type="NOA" address="0x00009888" value="0x00D34000" />
+        <register type="NOA" address="0x00009888" value="0x1190FC00" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x41900C00" />
+        <register type="NOA" address="0x00009888" value="0x43900002" />
+        <register type="NOA" address="0x00009888" value="0x53900420" />
+        <register type="NOA" address="0x00009888" value="0x459000A1" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+    </register_config>
+  </set>
+
+  <set name="Media Vme Pipe Gen9"
+       mdapi_supported_apis="MEDIA IO BB"
+       underscore_name="vme_pipe"
+       hw_config_guid="94272ad9-45ee-4e34-b7a7-51546cd6405c"
+       chipset="CFLGT3"
+       symbol_name="VMEPipe"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="EU Thread Occupancy"
+             description="The percentage of time in which hardware threads occupied EUs."
+             data_type="float"
+             max_equation="100"
+             equation="8 A 10 READ FMUL $EuThreadsCount FDIV $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_thread_occupancy"
+             units="percent"
+             symbol_name="EuThreadOccupancy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VME Busy"
+             description="The percentage of time in which VME (IME or CRE) was actively processing data."
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ B 3 READ FADD 2 FDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vme_busy"
+             units="percent"
+             symbol_name="VMEBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Overview System Batch Tier2"
+             mdapi_group="VME Pipe"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x141A5800" />
+        <register type="NOA" address="0x00009888" value="0x161A00C0" />
+        <register type="NOA" address="0x00009888" value="0x12180240" />
+        <register type="NOA" address="0x00009888" value="0x14180002" />
+        <register type="NOA" address="0x00009888" value="0x149A5800" />
+        <register type="NOA" address="0x00009888" value="0x169A00C0" />
+        <register type="NOA" address="0x00009888" value="0x12980240" />
+        <register type="NOA" address="0x00009888" value="0x14980002" />
+        <register type="NOA" address="0x00009888" value="0x1A4E3FC0" />
+        <register type="NOA" address="0x00009888" value="0x002F1000" />
+        <register type="NOA" address="0x00009888" value="0x022F8000" />
+        <register type="NOA" address="0x00009888" value="0x042F3000" />
+        <register type="NOA" address="0x00009888" value="0x004C4000" />
+        <register type="NOA" address="0x00009888" value="0x0A4C9500" />
+        <register type="NOA" address="0x00009888" value="0x0C4C002A" />
+        <register type="NOA" address="0x00009888" value="0x000D2000" />
+        <register type="NOA" address="0x00009888" value="0x060D8000" />
+        <register type="NOA" address="0x00009888" value="0x080DA000" />
+        <register type="NOA" address="0x00009888" value="0x0A0DA000" />
+        <register type="NOA" address="0x00009888" value="0x0C0DA000" />
+        <register type="NOA" address="0x00009888" value="0x0C0F0400" />
+        <register type="NOA" address="0x00009888" value="0x0E0F5500" />
+        <register type="NOA" address="0x00009888" value="0x100F0015" />
+        <register type="NOA" address="0x00009888" value="0x002C8000" />
+        <register type="NOA" address="0x00009888" value="0x0E2C8000" />
+        <register type="NOA" address="0x00009888" value="0x162CAA00" />
+        <register type="NOA" address="0x00009888" value="0x182C000A" />
+        <register type="NOA" address="0x00009888" value="0x04193000" />
+        <register type="NOA" address="0x00009888" value="0x081A28C1" />
+        <register type="NOA" address="0x00009888" value="0x001A0000" />
+        <register type="NOA" address="0x00009888" value="0x00133000" />
+        <register type="NOA" address="0x00009888" value="0x0613C000" />
+        <register type="NOA" address="0x00009888" value="0x0813F000" />
+        <register type="NOA" address="0x00009888" value="0x00172000" />
+        <register type="NOA" address="0x00009888" value="0x06178000" />
+        <register type="NOA" address="0x00009888" value="0x0817A000" />
+        <register type="NOA" address="0x00009888" value="0x00180037" />
+        <register type="NOA" address="0x00009888" value="0x06180940" />
+        <register type="NOA" address="0x00009888" value="0x08180000" />
+        <register type="NOA" address="0x00009888" value="0x02180000" />
+        <register type="NOA" address="0x00009888" value="0x04183000" />
+        <register type="NOA" address="0x00009888" value="0x04AFC000" />
+        <register type="NOA" address="0x00009888" value="0x06AF3000" />
+        <register type="NOA" address="0x00009888" value="0x0ACC4000" />
+        <register type="NOA" address="0x00009888" value="0x0CCC0015" />
+        <register type="NOA" address="0x00009888" value="0x0A8DA000" />
+        <register type="NOA" address="0x00009888" value="0x0C8DA000" />
+        <register type="NOA" address="0x00009888" value="0x0E8F4000" />
+        <register type="NOA" address="0x00009888" value="0x108F0015" />
+        <register type="NOA" address="0x00009888" value="0x16ACA000" />
+        <register type="NOA" address="0x00009888" value="0x18AC000A" />
+        <register type="NOA" address="0x00009888" value="0x06993000" />
+        <register type="NOA" address="0x00009888" value="0x0C9A28C1" />
+        <register type="NOA" address="0x00009888" value="0x009A0000" />
+        <register type="NOA" address="0x00009888" value="0x0A93F000" />
+        <register type="NOA" address="0x00009888" value="0x0C93F000" />
+        <register type="NOA" address="0x00009888" value="0x0A97A000" />
+        <register type="NOA" address="0x00009888" value="0x0C97A000" />
+        <register type="NOA" address="0x00009888" value="0x0A980977" />
+        <register type="NOA" address="0x00009888" value="0x08980000" />
+        <register type="NOA" address="0x00009888" value="0x04980000" />
+        <register type="NOA" address="0x00009888" value="0x06983000" />
+        <register type="NOA" address="0x00009888" value="0x119000FF" />
+        <register type="NOA" address="0x00009888" value="0x51900040" />
+        <register type="NOA" address="0x00009888" value="0x41900020" />
+        <register type="NOA" address="0x00009888" value="0x55900004" />
+        <register type="NOA" address="0x00009888" value="0x45900400" />
+        <register type="NOA" address="0x00009888" value="0x479008A5" />
+        <register type="NOA" address="0x00009888" value="0x57900000" />
+        <register type="NOA" address="0x00009888" value="0x49900002" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x30800000" />
+        <register type="OA" address="0x00002770" value="0x00100030" />
+        <register type="OA" address="0x00002774" value="0x0000FFF9" />
+        <register type="OA" address="0x00002778" value="0x00000002" />
+        <register type="OA" address="0x0000277C" value="0x0000FFFC" />
+        <register type="OA" address="0x00002780" value="0x00000002" />
+        <register type="OA" address="0x00002784" value="0x0000FFF3" />
+        <register type="OA" address="0x00002788" value="0x00100180" />
+        <register type="OA" address="0x0000278C" value="0x0000FFCF" />
+        <register type="OA" address="0x00002790" value="0x00000002" />
+        <register type="OA" address="0x00002794" value="0x0000FFCF" />
+        <register type="OA" address="0x00002798" value="0x00000002" />
+        <register type="OA" address="0x0000279C" value="0x0000FF3F" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00008003" />
+    </register_config>
+  </set>
+
+  <set name="Gpu Rings Busyness"
+       mdapi_supported_apis="VK OGL OCL MEDIA IO BB"
+       underscore_name="gpu_busyness"
+       hw_config_guid="22b7e0c2-cade-425f-b099-34479768c72a"
+       chipset="CFLGT3"
+       symbol_name="GpuBusyness"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="Vebox Ring Busy"
+             description="The percentage of time when vebox command streamer was busy."
+             data_type="float"
+             max_equation="100"
+             equation="C 4 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vebox_busy"
+             units="percent"
+             symbol_name="VeboxBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="System Frame Batch"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Render Ring Busy"
+             description="The percentage of time when render command streamer was busy."
+             data_type="float"
+             max_equation="100"
+             equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="render_busy"
+             units="percent"
+             symbol_name="RenderBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="System Frame Batch"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Vdbox0 Ring Busy"
+             description="The percentage of time when Vdbox0 command streamer was busy."
+             data_type="float"
+             max_equation="100"
+             equation="C 6 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vdbox0_busy"
+             units="percent"
+             symbol_name="Vdbox0Busy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="System Frame Batch"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Blitter Ring Busy"
+             description="The percentage of time when blitter command streamer was busy."
+             data_type="float"
+             max_equation="100"
+             equation="C 3 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="blitter_busy"
+             units="percent"
+             symbol_name="BlitterBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="System Frame Batch"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="AnyRingBusy"
+             description="The percentage of time when any command streamer was busy."
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="any_ring_busy"
+             units="percent"
+             symbol_name="AnyRingBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Vdbox1 Ring Busy"
+             description="The percentage of time when Vdbox1 command streamer was busy."
+             data_type="float"
+             max_equation="100"
+             equation="C 5 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vdbox1_busy"
+             units="percent"
+             symbol_name="Vdbox1Busy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="System Frame Batch"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x19D05800" />
+        <register type="NOA" address="0x00009888" value="0x13805800" />
+        <register type="NOA" address="0x00009888" value="0x05962C25" />
+        <register type="NOA" address="0x00009888" value="0x19950016" />
+        <register type="NOA" address="0x00009888" value="0x19C05800" />
+        <register type="NOA" address="0x00009888" value="0x05D00085" />
+        <register type="NOA" address="0x00009888" value="0x25D00000" />
+        <register type="NOA" address="0x00009888" value="0x09D54000" />
+        <register type="NOA" address="0x00009888" value="0x07800035" />
+        <register type="NOA" address="0x00009888" value="0x11800000" />
+        <register type="NOA" address="0x00009888" value="0x1D810400" />
+        <register type="NOA" address="0x00009888" value="0x21960000" />
+        <register type="NOA" address="0x00009888" value="0x0996C000" />
+        <register type="NOA" address="0x00009888" value="0x0B964000" />
+        <register type="NOA" address="0x00009888" value="0x19938000" />
+        <register type="NOA" address="0x00009888" value="0x1B930068" />
+        <register type="NOA" address="0x00009888" value="0x15948000" />
+        <register type="NOA" address="0x00009888" value="0x1B94000C" />
+        <register type="NOA" address="0x00009888" value="0x03957500" />
+        <register type="NOA" address="0x00009888" value="0x1D950000" />
+        <register type="NOA" address="0x00009888" value="0x17950000" />
+        <register type="NOA" address="0x00009888" value="0x07E54000" />
+        <register type="NOA" address="0x00009888" value="0x07928000" />
+        <register type="NOA" address="0x00009888" value="0x03988000" />
+        <register type="NOA" address="0x00009888" value="0x17908000" />
+        <register type="NOA" address="0x00009888" value="0x19904000" />
+        <register type="NOA" address="0x00009888" value="0x1B908000" />
+        <register type="NOA" address="0x00009888" value="0x1D908000" />
+        <register type="NOA" address="0x00009888" value="0x1F908000" />
+        <register type="NOA" address="0x00009888" value="0x09978000" />
+        <register type="NOA" address="0x00009888" value="0x05C08500" />
+        <register type="NOA" address="0x00009888" value="0x25C00000" />
+        <register type="NOA" address="0x00009888" value="0x1BC00000" />
+        <register type="NOA" address="0x00009888" value="0x0BC54000" />
+        <register type="NOA" address="0x00009888" value="0x11900000" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x43900463" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+        <register type="NOA" address="0x00009888" value="0x45900040" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x10800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+        <register type="OA" address="0x00002770" value="0x0007C000" />
+        <register type="OA" address="0x00002774" value="0x000007FF" />
+    </register_config>
+  </set>
+
+  <set name="MDAPI testing set Gen9"
+       mdapi_supported_apis="VK OGL OCL IO BB"
+       underscore_name="test_oa"
+       hw_config_guid="577e8e2c-3fa0-4875-8743-3538d585e3b0"
+       chipset="CFLGT3"
+       symbol_name="TestOa"
+       >
+    <counter name="TestCounter7"
+             description="HW test counter 7. Factor: 0.666"
+             data_type="uint64"
+             equation="B 7 READ"
+             underscore_name="counter7"
+             units="events"
+             symbol_name="Counter7"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="TestCounter8"
+             description="HW test counter 8. Should be equal to 1."
+             data_type="uint64"
+             equation="C 7 READ"
+             underscore_name="counter8"
+             units="events"
+             symbol_name="Counter8"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="TestCounter4"
+             description="HW test counter 4. Factor: 0.333"
+             data_type="uint64"
+             equation="B 4 READ"
+             underscore_name="counter4"
+             units="events"
+             symbol_name="Counter4"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="TestCounter5"
+             description="HW test counter 5. Factor: 0.333"
+             data_type="uint64"
+             equation="B 5 READ"
+             underscore_name="counter5"
+             units="events"
+             symbol_name="Counter5"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="TestCounter6"
+             description="HW test counter 6. Factor: 0.166"
+             data_type="uint64"
+             equation="B 6 READ"
+             underscore_name="counter6"
+             units="events"
+             symbol_name="Counter6"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="TestCounter3"
+             description="HW test counter 3. Factor: 0.5"
+             data_type="uint64"
+             equation="B 3 READ"
+             underscore_name="counter3"
+             units="events"
+             symbol_name="Counter3"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="TestCounter0"
+             description="HW test counter 0. Factor: 0.0"
+             data_type="uint64"
+             equation="B 0 READ"
+             underscore_name="counter0"
+             units="events"
+             symbol_name="Counter0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="TestCounter1"
+             description="HW test counter 1. Factor: 1.0"
+             data_type="uint64"
+             equation="B 1 READ"
+             underscore_name="counter1"
+             units="events"
+             symbol_name="Counter1"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="TestCounter2"
+             description="HW test counter 2. Factor: 1.0"
+             data_type="uint64"
+             equation="B 2 READ"
+             underscore_name="counter2"
+             units="events"
+             symbol_name="Counter2"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x11810000" />
+        <register type="NOA" address="0x00009888" value="0x07810013" />
+        <register type="NOA" address="0x00009888" value="0x1F810000" />
+        <register type="NOA" address="0x00009888" value="0x1D810000" />
+        <register type="NOA" address="0x00009888" value="0x1B930040" />
+        <register type="NOA" address="0x00009888" value="0x07E54000" />
+        <register type="NOA" address="0x00009888" value="0x1F908000" />
+        <register type="NOA" address="0x00009888" value="0x11900000" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+        <register type="NOA" address="0x00009888" value="0x45900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002744" value="0x00800000" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002770" value="0x00000004" />
+        <register type="OA" address="0x00002774" value="0x00000000" />
+        <register type="OA" address="0x00002778" value="0x00000003" />
+        <register type="OA" address="0x0000277C" value="0x00000000" />
+        <register type="OA" address="0x00002780" value="0x00000007" />
+        <register type="OA" address="0x00002784" value="0x00000000" />
+        <register type="OA" address="0x00002788" value="0x00100002" />
+        <register type="OA" address="0x0000278C" value="0x0000FFF7" />
+        <register type="OA" address="0x00002790" value="0x00100002" />
+        <register type="OA" address="0x00002794" value="0x0000FFCF" />
+        <register type="OA" address="0x00002798" value="0x00100082" />
+        <register type="OA" address="0x0000279C" value="0x0000FFEF" />
+        <register type="OA" address="0x000027A0" value="0x001000C2" />
+        <register type="OA" address="0x000027A4" value="0x0000FFE7" />
+        <register type="OA" address="0x000027A8" value="0x00100001" />
+        <register type="OA" address="0x000027AC" value="0x0000FFE7" />
+    </register_config>
+  </set>
+
+  <set name="Metric set PMA Stall"
+       mdapi_supported_apis="VK OGL OGL4 OCL IO MEDIA"
+       underscore_name="pma__stall"
+       hw_config_guid="c11af8d1-858b-4f8b-98fb-8d683ba8bda0"
+       chipset="CFLGT3"
+       symbol_name="PMA_Stall"
+       >
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="STC PMA stall"
+             description="Percentage of time when stencil cache line and an overlapping pixel are causing stalls"
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ B 1 READ FADD 2 FDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="stc_pma_stall"
+             units="percent"
+             symbol_name="StcPMAStall"
+             availability="$SliceMask 1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_group="GPU/Stencil Cache"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x122D3080" />
+        <register type="NOA" address="0x00009888" value="0x000D2000" />
+        <register type="NOA" address="0x00009888" value="0x060D8000" />
+        <register type="NOA" address="0x00009888" value="0x080DA000" />
+        <register type="NOA" address="0x00009888" value="0x0A0DA000" />
+        <register type="NOA" address="0x00009888" value="0x0C0F0800" />
+        <register type="NOA" address="0x00009888" value="0x0E0FAA00" />
+        <register type="NOA" address="0x00009888" value="0x100F0002" />
+        <register type="NOA" address="0x00009888" value="0x002D0025" />
+        <register type="NOA" address="0x00009888" value="0x062D1300" />
+        <register type="NOA" address="0x00009888" value="0x082D16A4" />
+        <register type="NOA" address="0x00009888" value="0x0A2D162E" />
+        <register type="NOA" address="0x00009888" value="0x102D0000" />
+        <register type="NOA" address="0x00009888" value="0x1190003F" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x41900000" />
+        <register type="NOA" address="0x00009888" value="0x55900000" />
+        <register type="NOA" address="0x00009888" value="0x45900000" />
+        <register type="NOA" address="0x00009888" value="0x47900000" />
+        <register type="NOA" address="0x00009888" value="0x57900000" />
+        <register type="NOA" address="0x00009888" value="0x49900000" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x30800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+        <register type="OA" address="0x00002770" value="0x00E00021" />
+        <register type="OA" address="0x00002774" value="0x0007FFF8" />
+        <register type="OA" address="0x00002778" value="0x07000101" />
+        <register type="OA" address="0x0000277C" value="0x0038FFC7" />
+    </register_config>
+  </set>
+
+</metrics>
diff --git a/lib/i915/perf-configs/oa-chv.xml b/lib/i915/perf-configs/oa-chv.xml
new file mode 100644
index 00000000..6267bb96
--- /dev/null
+++ b/lib/i915/perf-configs/oa-chv.xml
@@ -0,0 +1,9757 @@
+<?xml version="1.0"?>
+<metrics version="1581935518" merge_md5="">
+  <set name="Render Metrics Basic Gen8LP"
+       mdapi_supported_apis="VK OGL OCL IO BB"
+       underscore_name="render_basic"
+       hw_config_guid="9d8a3af5-c02c-4a4a-b947-f1672469e0fb"
+       chipset="CHV"
+       symbol_name="RenderBasic"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Misses"
+             description="The total number of L3 misses."
+             data_type="uint64"
+             equation="C 4 READ"
+             underscore_name="l3_misses"
+             units="messages"
+             symbol_name="L3Misses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/TAG"
+             />
+    <counter name="GTI L3 Throughput"
+             description="The total number of GPU memory bytes transferred between L3 caches and GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="$L3Misses 64 UMUL"
+             underscore_name="gti_l3_throughput"
+             units="bytes"
+             symbol_name="GtiL3Throughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler 1 Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which Sampler 1 has been slowing down the pipe when processing EU requests."
+             data_type="float"
+             high_watermark="15"
+             equation="B 3 READ 100 UMUL $GpuCoreClocks FDIV"
+             max_equation="100"
+             underscore_name="sampler1_bottleneck"
+             units="percent"
+             symbol_name="Sampler1Bottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="L3 Sampler Throughput"
+             description="The total number of GPU memory bytes transferred between samplers and L3 caches."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL"
+             equation="A 29 READ 64 UMUL"
+             underscore_name="l3_sampler_throughput"
+             units="bytes"
+             symbol_name="L3SamplerThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Sampler"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Sampler 0 Busy"
+             description="The percentage of time in which Sampler 0 has been processing EU requests."
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler0_busy"
+             units="percent"
+             symbol_name="Sampler0Busy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_group="Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Sampler 1 Busy"
+             description="The percentage of time in which Sampler 1 has been processing EU requests."
+             data_type="float"
+             max_equation="100"
+             equation="B 1 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler1_busy"
+             units="percent"
+             symbol_name="Sampler1Busy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_group="Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Samplers Busy"
+             description="The percentage of time in which samplers have been processing EU requests."
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ  B 1 READ UADD $GpuCoreClocks FDIV 2 FDIV 100 FMUL"
+             underscore_name="samplers_busy"
+             units="percent"
+             symbol_name="SamplersBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="Sampler"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GTI Fixed Pipe Throughput"
+             description="The total number of GPU memory bytes transferred between 3D Pipeline (Command Dispatch, Input Assembly and Stream Output) and GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL"
+             equation="B 6 READ B 7 READ UADD 64 UMUL"
+             underscore_name="gti_vf_throughput"
+             units="bytes"
+             symbol_name="GtiVfThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="GTI/3D Pipe"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler 0 Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which Sampler 0 has been slowing down the pipe when processing EU requests."
+             data_type="float"
+             high_watermark="15"
+             equation="B 2 READ 100 UMUL $GpuCoreClocks FDIV"
+             max_equation="100"
+             underscore_name="sampler0_bottleneck"
+             units="percent"
+             symbol_name="Sampler0Bottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texel lookups (with 2x2 accuracy) that missed the L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GTI Read Throughput"
+             description="The total number of GPU memory bytes read from GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL"
+             equation="C 6 READ 64 UMUL"
+             underscore_name="gti_read_throughput"
+             units="bytes"
+             symbol_name="GtiReadThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GTI Depth Throughput"
+             description="The total number of GPU memory bytes transferred between depth caches and GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL"
+             equation="C 0 READ C 1 READ UADD 64 UMUL"
+             underscore_name="gti_depth_throughput"
+             units="bytes"
+             symbol_name="GtiDepthThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="GTI/Depth Cache"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Samplers Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which samplers have been slowing down the pipe when processing EU requests."
+             data_type="float"
+             high_watermark="15"
+             equation="$Sampler0Bottleneck $Sampler1Bottleneck FMAX"
+             max_equation="100"
+             underscore_name="sampler_bottleneck"
+             units="percent"
+             symbol_name="SamplerBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Indicate System Frame Batch Draw"
+             mdapi_group="Sampler"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="GTI HDC TLB Lookup Throughput"
+             description="The total number of GPU memory bytes transferred between GTI and HDC, when HDC is doing TLB lookups."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="C 5 READ 64 UMUL"
+             underscore_name="gti_hdc_lookups_throughput"
+             units="bytes"
+             symbol_name="GtiHdcLookupsThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GTI RCC Throughput"
+             description="The total number of GPU memory bytes transferred between render color caches and GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL"
+             equation="C 2 READ C 3 READ UADD 64 UMUL"
+             underscore_name="gti_rcc_throughput"
+             units="bytes"
+             symbol_name="GtiRccThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="GTI/Color Cache"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="GTI Write Throughput"
+             description="The total number of GPU memory bytes written to GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 32 UMUL"
+             equation="C 7 READ 64 UMUL"
+             underscore_name="gti_write_throughput"
+             units="bytes"
+             symbol_name="GtiWriteThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL 2 UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses UADD UADD 64 UMUL"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x000000A0" />
+        <register type="NOA" address="0x00009888" value="0x59800000" />
+        <register type="NOA" address="0x00009888" value="0x59800001" />
+        <register type="NOA" address="0x00009888" value="0x285A0006" />
+        <register type="NOA" address="0x00009888" value="0x2C110014" />
+        <register type="NOA" address="0x00009888" value="0x2E110000" />
+        <register type="NOA" address="0x00009888" value="0x2C310014" />
+        <register type="NOA" address="0x00009888" value="0x2E310000" />
+        <register type="NOA" address="0x00009888" value="0x2B8303DF" />
+        <register type="NOA" address="0x00009888" value="0x3580024F" />
+        <register type="NOA" address="0x00009888" value="0x00580888" />
+        <register type="NOA" address="0x00009888" value="0x1E5A0015" />
+        <register type="NOA" address="0x00009888" value="0x205A0014" />
+        <register type="NOA" address="0x00009888" value="0x045A0000" />
+        <register type="NOA" address="0x00009888" value="0x025A0000" />
+        <register type="NOA" address="0x00009888" value="0x02180500" />
+        <register type="NOA" address="0x00009888" value="0x00190555" />
+        <register type="NOA" address="0x00009888" value="0x021D0500" />
+        <register type="NOA" address="0x00009888" value="0x021F0A00" />
+        <register type="NOA" address="0x00009888" value="0x00380444" />
+        <register type="NOA" address="0x00009888" value="0x02390500" />
+        <register type="NOA" address="0x00009888" value="0x003A0666" />
+        <register type="NOA" address="0x00009888" value="0x00100111" />
+        <register type="NOA" address="0x00009888" value="0x06110030" />
+        <register type="NOA" address="0x00009888" value="0x0A110031" />
+        <register type="NOA" address="0x00009888" value="0x0E110046" />
+        <register type="NOA" address="0x00009888" value="0x04110000" />
+        <register type="NOA" address="0x00009888" value="0x00110000" />
+        <register type="NOA" address="0x00009888" value="0x00130111" />
+        <register type="NOA" address="0x00009888" value="0x00300444" />
+        <register type="NOA" address="0x00009888" value="0x08310030" />
+        <register type="NOA" address="0x00009888" value="0x0C310031" />
+        <register type="NOA" address="0x00009888" value="0x10310046" />
+        <register type="NOA" address="0x00009888" value="0x04310000" />
+        <register type="NOA" address="0x00009888" value="0x00310000" />
+        <register type="NOA" address="0x00009888" value="0x00330444" />
+        <register type="NOA" address="0x00009888" value="0x038A0A00" />
+        <register type="NOA" address="0x00009888" value="0x018B0FFF" />
+        <register type="NOA" address="0x00009888" value="0x038B0A00" />
+        <register type="NOA" address="0x00009888" value="0x01855000" />
+        <register type="NOA" address="0x00009888" value="0x03850055" />
+        <register type="NOA" address="0x00009888" value="0x13830021" />
+        <register type="NOA" address="0x00009888" value="0x15830020" />
+        <register type="NOA" address="0x00009888" value="0x1783002F" />
+        <register type="NOA" address="0x00009888" value="0x1983002E" />
+        <register type="NOA" address="0x00009888" value="0x1B83002D" />
+        <register type="NOA" address="0x00009888" value="0x1D83002C" />
+        <register type="NOA" address="0x00009888" value="0x05830000" />
+        <register type="NOA" address="0x00009888" value="0x01840555" />
+        <register type="NOA" address="0x00009888" value="0x03840500" />
+        <register type="NOA" address="0x00009888" value="0x23800074" />
+        <register type="NOA" address="0x00009888" value="0x2580007D" />
+        <register type="NOA" address="0x00009888" value="0x05800000" />
+        <register type="NOA" address="0x00009888" value="0x01805000" />
+        <register type="NOA" address="0x00009888" value="0x03800055" />
+        <register type="NOA" address="0x00009888" value="0x01865000" />
+        <register type="NOA" address="0x00009888" value="0x03860055" />
+        <register type="NOA" address="0x00009888" value="0x01875000" />
+        <register type="NOA" address="0x00009888" value="0x03870055" />
+        <register type="NOA" address="0x00009888" value="0x418000AA" />
+        <register type="NOA" address="0x00009888" value="0x4380000A" />
+        <register type="NOA" address="0x00009888" value="0x45800000" />
+        <register type="NOA" address="0x00009888" value="0x4780000A" />
+        <register type="NOA" address="0x00009888" value="0x49800000" />
+        <register type="NOA" address="0x00009888" value="0x4B800000" />
+        <register type="NOA" address="0x00009888" value="0x4D800000" />
+        <register type="NOA" address="0x00009888" value="0x4F800000" />
+        <register type="NOA" address="0x00009888" value="0x51800000" />
+        <register type="NOA" address="0x00009888" value="0x53800000" />
+        <register type="NOA" address="0x00009888" value="0x55800000" />
+        <register type="NOA" address="0x00009888" value="0x57800000" />
+        <register type="NOA" address="0x00009888" value="0x59800000" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x00800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E758" value="0x00015014" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+        <register type="FLEX" address="0x0000E65C" value="0x00055054" />
+    </register_config>
+  </set>
+
+  <set name="Compute Metrics Basic Gen8LP"
+       mdapi_supported_apis="VK OGL4 OCL IO BB"
+       underscore_name="compute_basic"
+       hw_config_guid="f522a89c-ecd1-4522-8331-3383c54af5f5"
+       chipset="CHV"
+       symbol_name="ComputeBasic"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Untyped Bytes Read"
+             description="The total number of untyped memory bytes read via Data Port."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL"
+             equation="B 4 READ B 5 READ UADD 64 UMUL"
+             underscore_name="untyped_bytes_read"
+             units="bytes"
+             symbol_name="UntypedBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Typed Bytes Written"
+             description="The total number of typed memory bytes written via Data Port."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL"
+             equation="B 2 READ B 3 READ UADD 64 UMUL"
+             underscore_name="typed_bytes_written"
+             units="bytes"
+             symbol_name="TypedBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="fpu0_active"
+             units="percent"
+             symbol_name="Fpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="fpu1_active"
+             units="percent"
+             symbol_name="Fpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU AVG IPC Rate"
+             description="The average rate of IPC calculated for 2 FPU pipelines."
+             data_type="float"
+             max_equation="2"
+             equation="A 9 READ  A 10 READ  A 11 READ UADD  A 9 READ USUB FDIV 1 FADD"
+             underscore_name="eu_avg_ipc_rate"
+             units="number"
+             symbol_name="EuAvgIpcRate"
+             semantic_type="ratio"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier4 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texel lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GTI Read Throughput"
+             description="The total number of GPU memory bytes read from GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL"
+             equation="C 0 READ 64 UMUL"
+             underscore_name="gti_read_throughput"
+             units="bytes"
+             symbol_name="GtiReadThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GTI Ring Throughput"
+             description="The total number of GPU memory bytes transferred between GTI and Uncore ring."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 128 UMUL"
+             equation="C 2 READ 128 UMUL"
+             underscore_name="gti_ring_throughput"
+             units="bytes"
+             symbol_name="GtiRingThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Untyped Bytes Written"
+             description="The total number of untyped memory bytes written via Data Port."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL"
+             equation="B 6 READ B 7 READ UADD $EuSlicesTotalCount 64 UMUL UMUL"
+             underscore_name="untyped_bytes_written"
+             units="bytes"
+             symbol_name="UntypedBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="Typed Bytes Read"
+             description="The total number of typed memory bytes read via Data Port."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL"
+             equation="B 0 READ B 1 READ UADD 64 UMUL"
+             underscore_name="typed_bytes_read"
+             units="bytes"
+             symbol_name="TypedBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GTI Read-Only Stall"
+             description="The percentage of time in which GTI Read-Only port has been stalled."
+             data_type="float"
+             max_equation="100"
+             equation="C 3 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gti_ro_stall"
+             units="percent"
+             symbol_name="GtiRoStall"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="EU Thread Occupancy"
+             description="The percentage of time in which hardware threads occupied EUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 13 READ 8 UMUL $EuCoresTotalCount UDIV $EuThreadsCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_thread_occupancy"
+             units="percent"
+             symbol_name="EuThreadOccupancy"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GTI Read-Write Stall"
+             description="The percentage of time in which GTI Read-Write port has been stalled."
+             data_type="float"
+             max_equation="100"
+             equation="C 4 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gti_rw_stall"
+             units="percent"
+             symbol_name="GtiRwStall"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="GTI Write Throughput"
+             description="The total number of GPU memory bytes written to GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 32 UMUL"
+             equation="C 1 READ 64 UMUL"
+             underscore_name="gti_write_throughput"
+             units="bytes"
+             symbol_name="GtiWriteThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL 2 UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses UADD UADD 64 UMUL"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <counter name="EU Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_send_active"
+             units="percent"
+             symbol_name="EuSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x000000A0" />
+        <register type="NOA" address="0x00009888" value="0x59800000" />
+        <register type="NOA" address="0x00009888" value="0x59800001" />
+        <register type="NOA" address="0x00009888" value="0x2E5800E0" />
+        <register type="NOA" address="0x00009888" value="0x2E3800E0" />
+        <register type="NOA" address="0x00009888" value="0x3580024F" />
+        <register type="NOA" address="0x00009888" value="0x3D800140" />
+        <register type="NOA" address="0x00009888" value="0x08580042" />
+        <register type="NOA" address="0x00009888" value="0x0C580040" />
+        <register type="NOA" address="0x00009888" value="0x1058004C" />
+        <register type="NOA" address="0x00009888" value="0x1458004B" />
+        <register type="NOA" address="0x00009888" value="0x04580000" />
+        <register type="NOA" address="0x00009888" value="0x00580000" />
+        <register type="NOA" address="0x00009888" value="0x00195555" />
+        <register type="NOA" address="0x00009888" value="0x06380042" />
+        <register type="NOA" address="0x00009888" value="0x0A380040" />
+        <register type="NOA" address="0x00009888" value="0x0E38004C" />
+        <register type="NOA" address="0x00009888" value="0x1238004B" />
+        <register type="NOA" address="0x00009888" value="0x04380000" />
+        <register type="NOA" address="0x00009888" value="0x00384444" />
+        <register type="NOA" address="0x00009888" value="0x003A5555" />
+        <register type="NOA" address="0x00009888" value="0x018BFFFF" />
+        <register type="NOA" address="0x00009888" value="0x01845555" />
+        <register type="NOA" address="0x00009888" value="0x17800074" />
+        <register type="NOA" address="0x00009888" value="0x1980007D" />
+        <register type="NOA" address="0x00009888" value="0x1B80007C" />
+        <register type="NOA" address="0x00009888" value="0x1D8000B6" />
+        <register type="NOA" address="0x00009888" value="0x1F8000B7" />
+        <register type="NOA" address="0x00009888" value="0x05800000" />
+        <register type="NOA" address="0x00009888" value="0x03800000" />
+        <register type="NOA" address="0x00009888" value="0x418000AA" />
+        <register type="NOA" address="0x00009888" value="0x438000AA" />
+        <register type="NOA" address="0x00009888" value="0x45800000" />
+        <register type="NOA" address="0x00009888" value="0x47800000" />
+        <register type="NOA" address="0x00009888" value="0x4980012A" />
+        <register type="NOA" address="0x00009888" value="0x4B80012A" />
+        <register type="NOA" address="0x00009888" value="0x4D80012A" />
+        <register type="NOA" address="0x00009888" value="0x4F80012A" />
+        <register type="NOA" address="0x00009888" value="0x518001CE" />
+        <register type="NOA" address="0x00009888" value="0x538001CE" />
+        <register type="NOA" address="0x00009888" value="0x5580000E" />
+        <register type="NOA" address="0x00009888" value="0x59800000" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x00800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00000003" />
+        <register type="FLEX" address="0x0000E658" value="0x00002001" />
+        <register type="FLEX" address="0x0000E758" value="0x00778008" />
+        <register type="FLEX" address="0x0000E45C" value="0x00088078" />
+        <register type="FLEX" address="0x0000E55C" value="0x00808708" />
+        <register type="FLEX" address="0x0000E65C" value="0x00A08908" />
+    </register_config>
+  </set>
+
+  <set name="Render Metrics for 3D Pipeline Profile"
+       mdapi_supported_apis="VK OGL OCL IO BB"
+       underscore_name="render_pipe_profile"
+       hw_config_guid="a9ccc03d-a943-4e6b-9cd6-13e063075927"
+       chipset="CHV"
+       symbol_name="RenderPipeProfile"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Bottleneck"
+             low_watermark="10"
+             description="The percentage of time in which vertex shader pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="30"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_bottleneck"
+             units="percent"
+             symbol_name="VsBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Hi-Depth Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which early hierarchical depth test pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="15"
+             equation="C 6 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="hi_depth_bottleneck"
+             units="percent"
+             symbol_name="HiDepthBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which geometry shader pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="15"
+             equation="B 3 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gs_bottleneck"
+             units="percent"
+             symbol_name="GsBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Geometry Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="BC Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which barycentric coordinates calculation pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="15"
+             equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="bc_bottleneck"
+             units="percent"
+             symbol_name="BcBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Rasterizer/Barycentric Calc"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="HS Stall"
+             description="The percentage of time in which hull shader pipeline stage was stalled."
+             data_type="float"
+             equation="C 1 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="hs_stall"
+             units="percent"
+             symbol_name="HsStall"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier4 Correlate Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Hull Shader"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texel lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="VF Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which vertex fetch pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="15"
+             equation="C 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vf_bottleneck"
+             units="percent"
+             symbol_name="VfBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Input Assembler"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Strip-Fans Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which strip-fans pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="10"
+             equation="B 6 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sf_bottleneck"
+             units="percent"
+             symbol_name="SfBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Rasterizer/Strip-Fans"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Accesses"
+             description="The total number of messages sent to samplers."
+             data_type="uint64"
+             equation="A 28 READ"
+             underscore_name="sampler_accesses"
+             units="messages"
+             symbol_name="SamplerAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler"
+             />
+    <counter name="SF Stall"
+             description="The percentage of time in which strip-fans pipeline stage was stalled."
+             data_type="float"
+             equation="C 5 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sf_stall"
+             units="percent"
+             symbol_name="SfStall"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Correlate Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Strip-Fans"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="HS Bottleneck"
+             low_watermark="3"
+             description="The percentage of time in which hull shader pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="9"
+             equation="B 1 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="hs_bottleneck"
+             units="percent"
+             symbol_name="HsBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Hull Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="CL Stall"
+             description="The percentage of time in which clipper pipeline stage was stalled."
+             data_type="float"
+             equation="C 4 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="cl_stall"
+             units="percent"
+             symbol_name="ClStall"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Correlate Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Clipper"
+             />
+    <counter name="SO Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which stream output pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="15"
+             equation="B 4 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="so_bottleneck"
+             units="percent"
+             symbol_name="SoBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Stream Output"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="DS Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which domain shader pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="15"
+             equation="B 2 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ds_bottleneck"
+             units="percent"
+             symbol_name="DsBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Domain Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Clipper Bottleneck"
+             low_watermark="10"
+             description="The percentage of time in which clipper pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="30"
+             equation="B 5 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="cl_bottleneck"
+             units="percent"
+             symbol_name="ClBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Clipper"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Stall"
+             description="The percentage of time in which domain shader pipeline stage was stalled."
+             data_type="float"
+             equation="C 2 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ds_stall"
+             units="percent"
+             symbol_name="DsStall"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier4 Correlate Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Domain Shader"
+             />
+    <counter name="Early Depth Bottleneck"
+             low_watermark="10"
+             description="The percentage of time in which early depth test pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="30"
+             equation="B 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="early_depth_bottleneck"
+             units="percent"
+             symbol_name="EarlyDepthBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL 2 UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses UADD UADD 64 UMUL"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="SO Stall"
+             description="The percentage of time in which stream-output pipeline stage was stalled."
+             data_type="float"
+             equation="C 3 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="so_stall"
+             units="percent"
+             symbol_name="SoStall"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Correlate Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Stream Output"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x000000A0" />
+        <register type="NOA" address="0x00009888" value="0x59800000" />
+        <register type="NOA" address="0x00009888" value="0x59800001" />
+        <register type="NOA" address="0x00009888" value="0x261E0000" />
+        <register type="NOA" address="0x00009888" value="0x281F000F" />
+        <register type="NOA" address="0x00009888" value="0x2817001A" />
+        <register type="NOA" address="0x00009888" value="0x2791001F" />
+        <register type="NOA" address="0x00009888" value="0x27880019" />
+        <register type="NOA" address="0x00009888" value="0x2D890000" />
+        <register type="NOA" address="0x00009888" value="0x278A0007" />
+        <register type="NOA" address="0x00009888" value="0x298D001F" />
+        <register type="NOA" address="0x00009888" value="0x278E0020" />
+        <register type="NOA" address="0x00009888" value="0x2B8F0012" />
+        <register type="NOA" address="0x00009888" value="0x29900000" />
+        <register type="NOA" address="0x00009888" value="0x00184000" />
+        <register type="NOA" address="0x00009888" value="0x02181000" />
+        <register type="NOA" address="0x00009888" value="0x02194000" />
+        <register type="NOA" address="0x00009888" value="0x141E0002" />
+        <register type="NOA" address="0x00009888" value="0x041E0000" />
+        <register type="NOA" address="0x00009888" value="0x001E0000" />
+        <register type="NOA" address="0x00009888" value="0x221F0015" />
+        <register type="NOA" address="0x00009888" value="0x041F0000" />
+        <register type="NOA" address="0x00009888" value="0x001F4000" />
+        <register type="NOA" address="0x00009888" value="0x021F0000" />
+        <register type="NOA" address="0x00009888" value="0x023A8000" />
+        <register type="NOA" address="0x00009888" value="0x0213C000" />
+        <register type="NOA" address="0x00009888" value="0x02164000" />
+        <register type="NOA" address="0x00009888" value="0x24170012" />
+        <register type="NOA" address="0x00009888" value="0x04170000" />
+        <register type="NOA" address="0x00009888" value="0x07910005" />
+        <register type="NOA" address="0x00009888" value="0x05910000" />
+        <register type="NOA" address="0x00009888" value="0x01911500" />
+        <register type="NOA" address="0x00009888" value="0x03910501" />
+        <register type="NOA" address="0x00009888" value="0x0D880002" />
+        <register type="NOA" address="0x00009888" value="0x1D880003" />
+        <register type="NOA" address="0x00009888" value="0x05880000" />
+        <register type="NOA" address="0x00009888" value="0x0B890032" />
+        <register type="NOA" address="0x00009888" value="0x1B890031" />
+        <register type="NOA" address="0x00009888" value="0x05890000" />
+        <register type="NOA" address="0x00009888" value="0x01890040" />
+        <register type="NOA" address="0x00009888" value="0x03890040" />
+        <register type="NOA" address="0x00009888" value="0x098A0000" />
+        <register type="NOA" address="0x00009888" value="0x198A0004" />
+        <register type="NOA" address="0x00009888" value="0x058A0000" />
+        <register type="NOA" address="0x00009888" value="0x018A8050" />
+        <register type="NOA" address="0x00009888" value="0x038A2050" />
+        <register type="NOA" address="0x00009888" value="0x018B95A9" />
+        <register type="NOA" address="0x00009888" value="0x038BE5A9" />
+        <register type="NOA" address="0x00009888" value="0x018C1500" />
+        <register type="NOA" address="0x00009888" value="0x038C0501" />
+        <register type="NOA" address="0x00009888" value="0x178D0015" />
+        <register type="NOA" address="0x00009888" value="0x058D0000" />
+        <register type="NOA" address="0x00009888" value="0x138E0004" />
+        <register type="NOA" address="0x00009888" value="0x218E000C" />
+        <register type="NOA" address="0x00009888" value="0x058E0000" />
+        <register type="NOA" address="0x00009888" value="0x018E0500" />
+        <register type="NOA" address="0x00009888" value="0x038E0101" />
+        <register type="NOA" address="0x00009888" value="0x0F8F0027" />
+        <register type="NOA" address="0x00009888" value="0x058F0000" />
+        <register type="NOA" address="0x00009888" value="0x018F0000" />
+        <register type="NOA" address="0x00009888" value="0x038F0001" />
+        <register type="NOA" address="0x00009888" value="0x11900013" />
+        <register type="NOA" address="0x00009888" value="0x1F900017" />
+        <register type="NOA" address="0x00009888" value="0x05900000" />
+        <register type="NOA" address="0x00009888" value="0x01900100" />
+        <register type="NOA" address="0x00009888" value="0x03900001" />
+        <register type="NOA" address="0x00009888" value="0x01845555" />
+        <register type="NOA" address="0x00009888" value="0x03845555" />
+        <register type="NOA" address="0x00009888" value="0x418000AA" />
+        <register type="NOA" address="0x00009888" value="0x438000AA" />
+        <register type="NOA" address="0x00009888" value="0x458000AA" />
+        <register type="NOA" address="0x00009888" value="0x478000AA" />
+        <register type="NOA" address="0x00009888" value="0x4980018C" />
+        <register type="NOA" address="0x00009888" value="0x4B80014B" />
+        <register type="NOA" address="0x00009888" value="0x4D800128" />
+        <register type="NOA" address="0x00009888" value="0x4F80012A" />
+        <register type="NOA" address="0x00009888" value="0x51800187" />
+        <register type="NOA" address="0x00009888" value="0x5380014B" />
+        <register type="NOA" address="0x00009888" value="0x55800149" />
+        <register type="NOA" address="0x00009888" value="0x5780010A" />
+        <register type="NOA" address="0x00009888" value="0x59800000" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002724" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002770" value="0x0007FFEA" />
+        <register type="OA" address="0x00002774" value="0x00007FFC" />
+        <register type="OA" address="0x00002778" value="0x0007AFFA" />
+        <register type="OA" address="0x0000277C" value="0x0000F5FD" />
+        <register type="OA" address="0x00002780" value="0x00079FFA" />
+        <register type="OA" address="0x00002784" value="0x0000F3FB" />
+        <register type="OA" address="0x00002788" value="0x0007BF7A" />
+        <register type="OA" address="0x0000278C" value="0x0000F7E7" />
+        <register type="OA" address="0x00002790" value="0x0007FEFA" />
+        <register type="OA" address="0x00002794" value="0x0000F7CF" />
+        <register type="OA" address="0x00002798" value="0x00077FFA" />
+        <register type="OA" address="0x0000279C" value="0x0000EFDF" />
+        <register type="OA" address="0x000027A0" value="0x0006FFFA" />
+        <register type="OA" address="0x000027A4" value="0x0000CFBF" />
+        <register type="OA" address="0x000027A8" value="0x0003FFFA" />
+        <register type="OA" address="0x000027AC" value="0x00005F7F" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00015014" />
+        <register type="FLEX" address="0x0000E658" value="0x00025024" />
+        <register type="FLEX" address="0x0000E758" value="0x00035034" />
+        <register type="FLEX" address="0x0000E45C" value="0x00045044" />
+        <register type="FLEX" address="0x0000E55C" value="0x00055054" />
+        <register type="FLEX" address="0x0000E65C" value="0x00065064" />
+    </register_config>
+  </set>
+
+  <set name="Metric set HDCAndSF"
+       mdapi_supported_apis="VK OGL OCL IO BB"
+       underscore_name="hdc_and_sf"
+       hw_config_guid="33af8252-7a51-4aa3-b0ba-1b946f209d7b"
+       chipset="CHV"
+       symbol_name="HDCAndSF"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SQ is full"
+             description="The percentage of time when SQ is filled above a threshold (usually 48 entries)"
+             data_type="float"
+             max_equation="100"
+             equation="PERFCNT1 READ_REG 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gt_request_queue_full"
+             units="percent"
+             symbol_name="GTRequestQueueFull"
+             availability="true $QueryMode &amp;&amp;"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL4 OCL"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were actively processed on both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="Polygon Data Ready"
+             description="The percentage of time in which geometry pipeline output is ready"
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="poly_data_ready"
+             units="percent"
+             symbol_name="PolyDataReady"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/3D Pipe/Strip-Fans"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="HDC stalled by L3 (s1.ss2)"
+             description="Percentage of time when HDC has messages to L3, but it's stalled due to lack of credits (s1.ss2)"
+             data_type="float"
+             max_equation="100"
+             equation="C 1 READ C 0 READ USUB 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="non_sampler_shader12_access_stalled_on_l3"
+             units="percent"
+             symbol_name="NonSamplerShader12AccessStalledOnL3"
+             availability="$SubsliceMask 0x20 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="GPU/Data Port"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texel lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="HDC stalled by L3 (s0.ss1)"
+             description="Percentage of time when HDC has messages to L3, but it's stalled due to lack of credits (s0.ss1)"
+             data_type="float"
+             max_equation="100"
+             equation="C 5 READ C 4 READ USUB 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="non_sampler_shader01_access_stalled_on_l3"
+             units="percent"
+             symbol_name="NonSamplerShader01AccessStalledOnL3"
+             availability="$SubsliceMask 0x2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="GPU/Data Port"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="HDC stalled by L3 (s0.ss2)"
+             description="Percentage of time when HDC has messages to L3, but it's stalled due to lack of credits (s0.ss2)"
+             data_type="float"
+             max_equation="100"
+             equation="C 7 READ C 6 READ USUB 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="non_sampler_shader02_access_stalled_on_l3"
+             units="percent"
+             symbol_name="NonSamplerShader02AccessStalledOnL3"
+             availability="$SubsliceMask 0x4 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="GPU/Data Port"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="HDC stalled by L3 (s1.ss0)"
+             description="Percentage of time when HDC has messages to L3, but it's stalled due to lack of credits (s1.ss0)"
+             data_type="float"
+             max_equation="100"
+             equation="B 5 READ B 4 READ USUB 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="non_sampler_shader10_access_stalled_on_l3"
+             units="percent"
+             symbol_name="NonSamplerShader10AccessStalledOnL3"
+             availability="$SubsliceMask 0x8 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="GPU/Data Port"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="HDC stalled by L3 (s1.ss1)"
+             description="Percentage of time when HDC has messages to L3, but it's stalled due to lack of credits (s1.ss1)"
+             data_type="float"
+             max_equation="100"
+             equation="B 7 READ B 6 READ USUB 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="non_sampler_shader11_access_stalled_on_l3"
+             units="percent"
+             symbol_name="NonSamplerShader11AccessStalledOnL3"
+             availability="$SubsliceMask 0x10 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="GPU/Data Port"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL 2 UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="HDC stalled by L3 (s0.ss0)"
+             description="Percentage of time when HDC has messages to L3, but it's stalled due to lack of credits (s0.ss0)"
+             data_type="float"
+             max_equation="100"
+             equation="C 3 READ C 2 READ USUB 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="non_sampler_shader00_access_stalled_on_l3"
+             units="percent"
+             symbol_name="NonSamplerShader00AccessStalledOnL3"
+             availability="$SubsliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="GPU/Data Port"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x000000A0" />
+        <register type="NOA" address="0x00009888" value="0x105C0232" />
+        <register type="NOA" address="0x00009888" value="0x10580232" />
+        <register type="NOA" address="0x00009888" value="0x10380232" />
+        <register type="NOA" address="0x00009888" value="0x10DC0232" />
+        <register type="NOA" address="0x00009888" value="0x10D80232" />
+        <register type="NOA" address="0x00009888" value="0x10B80232" />
+        <register type="NOA" address="0x00009888" value="0x118E4400" />
+        <register type="NOA" address="0x00009888" value="0x025C6080" />
+        <register type="NOA" address="0x00009888" value="0x045C004B" />
+        <register type="NOA" address="0x00009888" value="0x005C8000" />
+        <register type="NOA" address="0x00009888" value="0x00582080" />
+        <register type="NOA" address="0x00009888" value="0x0258004B" />
+        <register type="NOA" address="0x00009888" value="0x025B4000" />
+        <register type="NOA" address="0x00009888" value="0x045B4000" />
+        <register type="NOA" address="0x00009888" value="0x0C1FA000" />
+        <register type="NOA" address="0x00009888" value="0x0E1F00AA" />
+        <register type="NOA" address="0x00009888" value="0x04386080" />
+        <register type="NOA" address="0x00009888" value="0x0638404B" />
+        <register type="NOA" address="0x00009888" value="0x02384000" />
+        <register type="NOA" address="0x00009888" value="0x08384000" />
+        <register type="NOA" address="0x00009888" value="0x0A380000" />
+        <register type="NOA" address="0x00009888" value="0x0C380000" />
+        <register type="NOA" address="0x00009888" value="0x00398000" />
+        <register type="NOA" address="0x00009888" value="0x0239A000" />
+        <register type="NOA" address="0x00009888" value="0x0439A000" />
+        <register type="NOA" address="0x00009888" value="0x06392000" />
+        <register type="NOA" address="0x00009888" value="0x0CDC25C1" />
+        <register type="NOA" address="0x00009888" value="0x0ADCC000" />
+        <register type="NOA" address="0x00009888" value="0x0AD825C1" />
+        <register type="NOA" address="0x00009888" value="0x18DB4000" />
+        <register type="NOA" address="0x00009888" value="0x1ADB0001" />
+        <register type="NOA" address="0x00009888" value="0x0E9F8000" />
+        <register type="NOA" address="0x00009888" value="0x109F02AA" />
+        <register type="NOA" address="0x00009888" value="0x0EB825C1" />
+        <register type="NOA" address="0x00009888" value="0x18B80154" />
+        <register type="NOA" address="0x00009888" value="0x0AB9A000" />
+        <register type="NOA" address="0x00009888" value="0x0CB9A000" />
+        <register type="NOA" address="0x00009888" value="0x0EB9A000" />
+        <register type="NOA" address="0x00009888" value="0x0D88C000" />
+        <register type="NOA" address="0x00009888" value="0x0F88000F" />
+        <register type="NOA" address="0x00009888" value="0x038A8000" />
+        <register type="NOA" address="0x00009888" value="0x058A8000" />
+        <register type="NOA" address="0x00009888" value="0x078A8000" />
+        <register type="NOA" address="0x00009888" value="0x098A8000" />
+        <register type="NOA" address="0x00009888" value="0x0B8A8000" />
+        <register type="NOA" address="0x00009888" value="0x0D8A8000" />
+        <register type="NOA" address="0x00009888" value="0x258BAA05" />
+        <register type="NOA" address="0x00009888" value="0x278B002A" />
+        <register type="NOA" address="0x00009888" value="0x238B2A80" />
+        <register type="NOA" address="0x00009888" value="0x198C5400" />
+        <register type="NOA" address="0x00009888" value="0x1B8C0015" />
+        <register type="NOA" address="0x00009888" value="0x098DC000" />
+        <register type="NOA" address="0x00009888" value="0x0B8DA000" />
+        <register type="NOA" address="0x00009888" value="0x0D8DA000" />
+        <register type="NOA" address="0x00009888" value="0x0F8DA000" />
+        <register type="NOA" address="0x00009888" value="0x098E05C0" />
+        <register type="NOA" address="0x00009888" value="0x058E0000" />
+        <register type="NOA" address="0x00009888" value="0x198F0020" />
+        <register type="NOA" address="0x00009888" value="0x2185AA0A" />
+        <register type="NOA" address="0x00009888" value="0x2385002A" />
+        <register type="NOA" address="0x00009888" value="0x1F85AA00" />
+        <register type="NOA" address="0x00009888" value="0x19835000" />
+        <register type="NOA" address="0x00009888" value="0x1B830155" />
+        <register type="NOA" address="0x00009888" value="0x03834000" />
+        <register type="NOA" address="0x00009888" value="0x05834000" />
+        <register type="NOA" address="0x00009888" value="0x07834000" />
+        <register type="NOA" address="0x00009888" value="0x09834000" />
+        <register type="NOA" address="0x00009888" value="0x0B834000" />
+        <register type="NOA" address="0x00009888" value="0x0D834000" />
+        <register type="NOA" address="0x00009888" value="0x09848000" />
+        <register type="NOA" address="0x00009888" value="0x0B84C000" />
+        <register type="NOA" address="0x00009888" value="0x0D84C000" />
+        <register type="NOA" address="0x00009888" value="0x0F84C000" />
+        <register type="NOA" address="0x00009888" value="0x01848000" />
+        <register type="NOA" address="0x00009888" value="0x0384C000" />
+        <register type="NOA" address="0x00009888" value="0x0584C000" />
+        <register type="NOA" address="0x00009888" value="0x07844000" />
+        <register type="NOA" address="0x00009888" value="0x19808000" />
+        <register type="NOA" address="0x00009888" value="0x1B80C000" />
+        <register type="NOA" address="0x00009888" value="0x1D80C000" />
+        <register type="NOA" address="0x00009888" value="0x1F80C000" />
+        <register type="NOA" address="0x00009888" value="0x11808000" />
+        <register type="NOA" address="0x00009888" value="0x1380C000" />
+        <register type="NOA" address="0x00009888" value="0x1580C000" />
+        <register type="NOA" address="0x00009888" value="0x17804000" />
+        <register type="NOA" address="0x00009888" value="0x51800040" />
+        <register type="NOA" address="0x00009888" value="0x43800400" />
+        <register type="NOA" address="0x00009888" value="0x45800800" />
+        <register type="NOA" address="0x00009888" value="0x53800000" />
+        <register type="NOA" address="0x00009888" value="0x47800C62" />
+        <register type="NOA" address="0x00009888" value="0x21800000" />
+        <register type="NOA" address="0x00009888" value="0x31800000" />
+        <register type="NOA" address="0x00009888" value="0x4D800000" />
+        <register type="NOA" address="0x00009888" value="0x3F801042" />
+        <register type="NOA" address="0x00009888" value="0x4F800000" />
+        <register type="NOA" address="0x00009888" value="0x418014A4" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x000091BC" value="0xE0500000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002744" value="0x00800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x10800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+        <register type="OA" address="0x00002770" value="0x00000002" />
+        <register type="OA" address="0x00002774" value="0x0000FFF7" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E758" value="0x00015014" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+        <register type="FLEX" address="0x0000E65C" value="0x00055054" />
+    </register_config>
+  </set>
+
+  <set name="Metric set L3_1"
+       mdapi_supported_apis="VK OGL OCL IO BB"
+       underscore_name="l3_1"
+       hw_config_guid="78f52900-5317-4417-8067-966fbf215a1f"
+       chipset="CHV"
+       symbol_name="L3_1"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice1 L3 Bank1 Stalled"
+             description="The percentage of time in which slice1 L3 bank1 is stalled"
+             data_type="float"
+             max_equation="100"
+             equation="B 4 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l31_bank1_stalled"
+             units="percent"
+             symbol_name="L31Bank1Stalled"
+             availability="$SliceMask 0x2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SQ is full"
+             description="The percentage of time when SQ is filled above a threshold (usually 48 entries)"
+             data_type="float"
+             max_equation="100"
+             equation="PERFCNT1 READ_REG 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gt_request_queue_full"
+             units="percent"
+             symbol_name="GTRequestQueueFull"
+             availability="true $QueryMode &&"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL4 OCL"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on the both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Slice1 L3 Bank0 Stalled"
+             description="The percentage of time in which slice1 L3 bank0 is stalled"
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l31_bank0_stalled"
+             units="percent"
+             symbol_name="L31Bank0Stalled"
+             availability="$SliceMask 0x2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="Slice1 L3 Bank1 Active"
+             description="The percentage of time in which slice1 L3 bank1 is active"
+             data_type="float"
+             max_equation="100"
+             equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l31_bank1_active"
+             units="percent"
+             symbol_name="L31Bank1Active"
+             availability="$SliceMask 0x2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice1 L3 Bank0 Active"
+             description="The percentage of time in which slice1 L3 bank0 is active"
+             data_type="float"
+             max_equation="100"
+             equation="C 6 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l31_bank0_active"
+             units="percent"
+             symbol_name="L31Bank0Active"
+             availability="$SliceMask 0x2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL 2 UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x000000A0" />
+        <register type="NOA" address="0x00009888" value="0x10BF03DA" />
+        <register type="NOA" address="0x00009888" value="0x14BF0001" />
+        <register type="NOA" address="0x00009888" value="0x12980340" />
+        <register type="NOA" address="0x00009888" value="0x12990340" />
+        <register type="NOA" address="0x00009888" value="0x0CBF1187" />
+        <register type="NOA" address="0x00009888" value="0x0EBF1205" />
+        <register type="NOA" address="0x00009888" value="0x00BF0500" />
+        <register type="NOA" address="0x00009888" value="0x02BF042B" />
+        <register type="NOA" address="0x00009888" value="0x04BF002C" />
+        <register type="NOA" address="0x00009888" value="0x0CDAC000" />
+        <register type="NOA" address="0x00009888" value="0x0EDAC000" />
+        <register type="NOA" address="0x00009888" value="0x00DA8000" />
+        <register type="NOA" address="0x00009888" value="0x02DAC000" />
+        <register type="NOA" address="0x00009888" value="0x04DA4000" />
+        <register type="NOA" address="0x00009888" value="0x04983400" />
+        <register type="NOA" address="0x00009888" value="0x10980000" />
+        <register type="NOA" address="0x00009888" value="0x06990034" />
+        <register type="NOA" address="0x00009888" value="0x10990000" />
+        <register type="NOA" address="0x00009888" value="0x0C9DC000" />
+        <register type="NOA" address="0x00009888" value="0x0E9DC000" />
+        <register type="NOA" address="0x00009888" value="0x009D8000" />
+        <register type="NOA" address="0x00009888" value="0x029DC000" />
+        <register type="NOA" address="0x00009888" value="0x049D4000" />
+        <register type="NOA" address="0x00009888" value="0x109F02A8" />
+        <register type="NOA" address="0x00009888" value="0x0C9FA000" />
+        <register type="NOA" address="0x00009888" value="0x0E9F00BA" />
+        <register type="NOA" address="0x00009888" value="0x0CB88000" />
+        <register type="NOA" address="0x00009888" value="0x0CB95000" />
+        <register type="NOA" address="0x00009888" value="0x0EB95000" />
+        <register type="NOA" address="0x00009888" value="0x00B94000" />
+        <register type="NOA" address="0x00009888" value="0x02B95000" />
+        <register type="NOA" address="0x00009888" value="0x04B91000" />
+        <register type="NOA" address="0x00009888" value="0x06B92000" />
+        <register type="NOA" address="0x00009888" value="0x0CBA4000" />
+        <register type="NOA" address="0x00009888" value="0x0F88000F" />
+        <register type="NOA" address="0x00009888" value="0x03888000" />
+        <register type="NOA" address="0x00009888" value="0x05888000" />
+        <register type="NOA" address="0x00009888" value="0x07888000" />
+        <register type="NOA" address="0x00009888" value="0x09888000" />
+        <register type="NOA" address="0x00009888" value="0x0B888000" />
+        <register type="NOA" address="0x00009888" value="0x0D880400" />
+        <register type="NOA" address="0x00009888" value="0x258B800A" />
+        <register type="NOA" address="0x00009888" value="0x278B002A" />
+        <register type="NOA" address="0x00009888" value="0x238B5500" />
+        <register type="NOA" address="0x00009888" value="0x198C4000" />
+        <register type="NOA" address="0x00009888" value="0x1B8C0015" />
+        <register type="NOA" address="0x00009888" value="0x038C4000" />
+        <register type="NOA" address="0x00009888" value="0x058C4000" />
+        <register type="NOA" address="0x00009888" value="0x078C4000" />
+        <register type="NOA" address="0x00009888" value="0x098C4000" />
+        <register type="NOA" address="0x00009888" value="0x0B8C4000" />
+        <register type="NOA" address="0x00009888" value="0x0D8C4000" />
+        <register type="NOA" address="0x00009888" value="0x0D8DA000" />
+        <register type="NOA" address="0x00009888" value="0x0F8DA000" />
+        <register type="NOA" address="0x00009888" value="0x018D8000" />
+        <register type="NOA" address="0x00009888" value="0x038DA000" />
+        <register type="NOA" address="0x00009888" value="0x058DA000" />
+        <register type="NOA" address="0x00009888" value="0x078D2000" />
+        <register type="NOA" address="0x00009888" value="0x2185800A" />
+        <register type="NOA" address="0x00009888" value="0x2385002A" />
+        <register type="NOA" address="0x00009888" value="0x1F85AA00" />
+        <register type="NOA" address="0x00009888" value="0x1B830154" />
+        <register type="NOA" address="0x00009888" value="0x03834000" />
+        <register type="NOA" address="0x00009888" value="0x05834000" />
+        <register type="NOA" address="0x00009888" value="0x07834000" />
+        <register type="NOA" address="0x00009888" value="0x09834000" />
+        <register type="NOA" address="0x00009888" value="0x0B834000" />
+        <register type="NOA" address="0x00009888" value="0x0D834000" />
+        <register type="NOA" address="0x00009888" value="0x0D84C000" />
+        <register type="NOA" address="0x00009888" value="0x0F84C000" />
+        <register type="NOA" address="0x00009888" value="0x01848000" />
+        <register type="NOA" address="0x00009888" value="0x0384C000" />
+        <register type="NOA" address="0x00009888" value="0x0584C000" />
+        <register type="NOA" address="0x00009888" value="0x07844000" />
+        <register type="NOA" address="0x00009888" value="0x1D80C000" />
+        <register type="NOA" address="0x00009888" value="0x1F80C000" />
+        <register type="NOA" address="0x00009888" value="0x11808000" />
+        <register type="NOA" address="0x00009888" value="0x1380C000" />
+        <register type="NOA" address="0x00009888" value="0x1580C000" />
+        <register type="NOA" address="0x00009888" value="0x17804000" />
+        <register type="NOA" address="0x00009888" value="0x53800000" />
+        <register type="NOA" address="0x00009888" value="0x45800000" />
+        <register type="NOA" address="0x00009888" value="0x47800000" />
+        <register type="NOA" address="0x00009888" value="0x21800000" />
+        <register type="NOA" address="0x00009888" value="0x31800000" />
+        <register type="NOA" address="0x00009888" value="0x4D800000" />
+        <register type="NOA" address="0x00009888" value="0x3F800000" />
+        <register type="NOA" address="0x00009888" value="0x4F800000" />
+        <register type="NOA" address="0x00009888" value="0x41800060" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x000091BC" value="0xE0500000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002744" value="0x00800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0xF0800000" />
+        <register type="OA" address="0x00002770" value="0x00100070" />
+        <register type="OA" address="0x00002774" value="0x0000FFF1" />
+        <register type="OA" address="0x00002778" value="0x00014002" />
+        <register type="OA" address="0x0000277C" value="0x0000C3FF" />
+        <register type="OA" address="0x00002780" value="0x00010002" />
+        <register type="OA" address="0x00002784" value="0x0000C7FF" />
+        <register type="OA" address="0x00002788" value="0x00004002" />
+        <register type="OA" address="0x0000278C" value="0x0000D3FF" />
+        <register type="OA" address="0x00002790" value="0x00100700" />
+        <register type="OA" address="0x00002794" value="0x0000FF1F" />
+        <register type="OA" address="0x00002798" value="0x00001402" />
+        <register type="OA" address="0x0000279C" value="0x0000FC3F" />
+        <register type="OA" address="0x000027A0" value="0x00001002" />
+        <register type="OA" address="0x000027A4" value="0x0000FC7F" />
+        <register type="OA" address="0x000027A8" value="0x00000402" />
+        <register type="OA" address="0x000027AC" value="0x0000FD3F" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E758" value="0x00015014" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+        <register type="FLEX" address="0x0000E65C" value="0x00055054" />
+    </register_config>
+  </set>
+
+  <set name="Metric set L3_2"
+       mdapi_supported_apis="VK OGL OCL IO BB"
+       underscore_name="l3_2"
+       hw_config_guid="0db4fe4a-2648-4064-bd6a-89c06d0c27b3"
+       chipset="CHV"
+       symbol_name="L3_2"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 L3 Bank1 Active"
+             description="The percentage of time in which slice0 L3 bank1 is active"
+             data_type="float"
+             max_equation="100"
+             equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l30_bank1_active"
+             units="percent"
+             symbol_name="L30Bank1Active"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SQ is full"
+             description="The percentage of time when SQ is filled above a threshold (usually 48 entries)"
+             data_type="float"
+             max_equation="100"
+             equation="PERFCNT1 READ_REG 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gt_request_queue_full"
+             units="percent"
+             symbol_name="GTRequestQueueFull"
+             availability="true $QueryMode &&"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL4 OCL"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on the both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="Slice0 L3 Bank1 Stalled"
+             description="The percentage of time in which slice0 L3 bank1 is stalled"
+             data_type="float"
+             max_equation="100"
+             equation="B 4 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l30_bank1_stalled"
+             units="percent"
+             symbol_name="L30Bank1Stalled"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 L3 Bank0 Active"
+             description="The percentage of time in which slice0 L3 bank0 is active"
+             data_type="float"
+             max_equation="100"
+             equation="C 6 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l30_bank0_active"
+             units="percent"
+             symbol_name="L30Bank0Active"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 L3 Bank0 Stalled"
+             description="The percentage of time in which slice0 L3 bank0 is stalled"
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l30_bank0_stalled"
+             units="percent"
+             symbol_name="L30Bank0Stalled"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL 2 UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x000000A0" />
+        <register type="NOA" address="0x00009888" value="0x103F03DA" />
+        <register type="NOA" address="0x00009888" value="0x143F0001" />
+        <register type="NOA" address="0x00009888" value="0x12180340" />
+        <register type="NOA" address="0x00009888" value="0x12190340" />
+        <register type="NOA" address="0x00009888" value="0x0C3F1187" />
+        <register type="NOA" address="0x00009888" value="0x0E3F1205" />
+        <register type="NOA" address="0x00009888" value="0x003F0500" />
+        <register type="NOA" address="0x00009888" value="0x023F042B" />
+        <register type="NOA" address="0x00009888" value="0x043F002C" />
+        <register type="NOA" address="0x00009888" value="0x0C5AC000" />
+        <register type="NOA" address="0x00009888" value="0x0E5AC000" />
+        <register type="NOA" address="0x00009888" value="0x005A8000" />
+        <register type="NOA" address="0x00009888" value="0x025AC000" />
+        <register type="NOA" address="0x00009888" value="0x045A4000" />
+        <register type="NOA" address="0x00009888" value="0x04183400" />
+        <register type="NOA" address="0x00009888" value="0x10180000" />
+        <register type="NOA" address="0x00009888" value="0x06190034" />
+        <register type="NOA" address="0x00009888" value="0x10190000" />
+        <register type="NOA" address="0x00009888" value="0x0C1DC000" />
+        <register type="NOA" address="0x00009888" value="0x0E1DC000" />
+        <register type="NOA" address="0x00009888" value="0x001D8000" />
+        <register type="NOA" address="0x00009888" value="0x021DC000" />
+        <register type="NOA" address="0x00009888" value="0x041D4000" />
+        <register type="NOA" address="0x00009888" value="0x101F02A8" />
+        <register type="NOA" address="0x00009888" value="0x0C1FA000" />
+        <register type="NOA" address="0x00009888" value="0x0E1F00BA" />
+        <register type="NOA" address="0x00009888" value="0x0C388000" />
+        <register type="NOA" address="0x00009888" value="0x0C395000" />
+        <register type="NOA" address="0x00009888" value="0x0E395000" />
+        <register type="NOA" address="0x00009888" value="0x00394000" />
+        <register type="NOA" address="0x00009888" value="0x02395000" />
+        <register type="NOA" address="0x00009888" value="0x04391000" />
+        <register type="NOA" address="0x00009888" value="0x06392000" />
+        <register type="NOA" address="0x00009888" value="0x0C3A4000" />
+        <register type="NOA" address="0x00009888" value="0x1B8AA800" />
+        <register type="NOA" address="0x00009888" value="0x1D8A0002" />
+        <register type="NOA" address="0x00009888" value="0x038A8000" />
+        <register type="NOA" address="0x00009888" value="0x058A8000" />
+        <register type="NOA" address="0x00009888" value="0x078A8000" />
+        <register type="NOA" address="0x00009888" value="0x098A8000" />
+        <register type="NOA" address="0x00009888" value="0x0B8A8000" />
+        <register type="NOA" address="0x00009888" value="0x0D8A8000" />
+        <register type="NOA" address="0x00009888" value="0x258B4005" />
+        <register type="NOA" address="0x00009888" value="0x278B0015" />
+        <register type="NOA" address="0x00009888" value="0x238B2A80" />
+        <register type="NOA" address="0x00009888" value="0x2185800A" />
+        <register type="NOA" address="0x00009888" value="0x2385002A" />
+        <register type="NOA" address="0x00009888" value="0x1F85AA00" />
+        <register type="NOA" address="0x00009888" value="0x1B830154" />
+        <register type="NOA" address="0x00009888" value="0x03834000" />
+        <register type="NOA" address="0x00009888" value="0x05834000" />
+        <register type="NOA" address="0x00009888" value="0x07834000" />
+        <register type="NOA" address="0x00009888" value="0x09834000" />
+        <register type="NOA" address="0x00009888" value="0x0B834000" />
+        <register type="NOA" address="0x00009888" value="0x0D834000" />
+        <register type="NOA" address="0x00009888" value="0x0D84C000" />
+        <register type="NOA" address="0x00009888" value="0x0F84C000" />
+        <register type="NOA" address="0x00009888" value="0x01848000" />
+        <register type="NOA" address="0x00009888" value="0x0384C000" />
+        <register type="NOA" address="0x00009888" value="0x0584C000" />
+        <register type="NOA" address="0x00009888" value="0x07844000" />
+        <register type="NOA" address="0x00009888" value="0x1D80C000" />
+        <register type="NOA" address="0x00009888" value="0x1F80C000" />
+        <register type="NOA" address="0x00009888" value="0x11808000" />
+        <register type="NOA" address="0x00009888" value="0x1380C000" />
+        <register type="NOA" address="0x00009888" value="0x1580C000" />
+        <register type="NOA" address="0x00009888" value="0x17804000" />
+        <register type="NOA" address="0x00009888" value="0x53800000" />
+        <register type="NOA" address="0x00009888" value="0x45800000" />
+        <register type="NOA" address="0x00009888" value="0x47800000" />
+        <register type="NOA" address="0x00009888" value="0x21800000" />
+        <register type="NOA" address="0x00009888" value="0x31800000" />
+        <register type="NOA" address="0x00009888" value="0x4D800000" />
+        <register type="NOA" address="0x00009888" value="0x3F800000" />
+        <register type="NOA" address="0x00009888" value="0x4F800000" />
+        <register type="NOA" address="0x00009888" value="0x41800060" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x000091BC" value="0xE0500000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002744" value="0x00800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0xF0800000" />
+        <register type="OA" address="0x00002770" value="0x00100070" />
+        <register type="OA" address="0x00002774" value="0x0000FFF1" />
+        <register type="OA" address="0x00002778" value="0x00014002" />
+        <register type="OA" address="0x0000277C" value="0x0000C3FF" />
+        <register type="OA" address="0x00002780" value="0x00010002" />
+        <register type="OA" address="0x00002784" value="0x0000C7FF" />
+        <register type="OA" address="0x00002788" value="0x00004002" />
+        <register type="OA" address="0x0000278C" value="0x0000D3FF" />
+        <register type="OA" address="0x00002790" value="0x00100700" />
+        <register type="OA" address="0x00002794" value="0x0000FF1F" />
+        <register type="OA" address="0x00002798" value="0x00001402" />
+        <register type="OA" address="0x0000279C" value="0x0000FC3F" />
+        <register type="OA" address="0x000027A0" value="0x00001002" />
+        <register type="OA" address="0x000027A4" value="0x0000FC7F" />
+        <register type="OA" address="0x000027A8" value="0x00000402" />
+        <register type="OA" address="0x000027AC" value="0x0000FD3F" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E758" value="0x00015014" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+        <register type="FLEX" address="0x0000E65C" value="0x00055054" />
+    </register_config>
+  </set>
+
+  <set name="Metric set L3_3"
+       mdapi_supported_apis="VK OGL OCL IO BB"
+       underscore_name="l3_3"
+       hw_config_guid="0de6539e-33b4-4aee-83c4-9ab45a579b94"
+       chipset="CHV"
+       symbol_name="L3_3"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SQ is full"
+             description="The percentage of time when SQ is filled above a threshold (usually 48 entries)"
+             data_type="float"
+             max_equation="100"
+             equation="PERFCNT1 READ_REG 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gt_request_queue_full"
+             units="percent"
+             symbol_name="GTRequestQueueFull"
+             availability="true $QueryMode &&"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL4 OCL"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on the both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Slice0 L3 Bank3 Stalled"
+             description="The percentage of time in which slice0 L3 bank3 is stalled"
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l30_bank3_stalled"
+             units="percent"
+             symbol_name="L30Bank3Stalled"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 L3 Bank3 Active"
+             description="The percentage of time in which slice0 L3 bank3 is active"
+             data_type="float"
+             max_equation="100"
+             equation="C 6 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l30_bank3_active"
+             units="percent"
+             symbol_name="L30Bank3Active"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice1 L3 Bank3 Active"
+             description="The percentage of time in which slice1 L3 bank3 is active"
+             data_type="float"
+             max_equation="100"
+             equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l31_bank3_active"
+             units="percent"
+             symbol_name="L31Bank3Active"
+             availability="$SliceMask 0x2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Slice1 L3 Bank3 Stalled"
+             description="The percentage of time in which slice1 L3 bank3 is stalled"
+             data_type="float"
+             max_equation="100"
+             equation="B 4 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l31_bank3_stalled"
+             units="percent"
+             symbol_name="L31Bank3Stalled"
+             availability="$SliceMask 0x2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL 2 UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x000000A0" />
+        <register type="NOA" address="0x00009888" value="0x121B0340" />
+        <register type="NOA" address="0x00009888" value="0x103F0274" />
+        <register type="NOA" address="0x00009888" value="0x123F0000" />
+        <register type="NOA" address="0x00009888" value="0x129B0340" />
+        <register type="NOA" address="0x00009888" value="0x10BF0274" />
+        <register type="NOA" address="0x00009888" value="0x12BF0000" />
+        <register type="NOA" address="0x00009888" value="0x041B3400" />
+        <register type="NOA" address="0x00009888" value="0x101B0000" />
+        <register type="NOA" address="0x00009888" value="0x045C8000" />
+        <register type="NOA" address="0x00009888" value="0x0A3D4000" />
+        <register type="NOA" address="0x00009888" value="0x003F0080" />
+        <register type="NOA" address="0x00009888" value="0x023F0793" />
+        <register type="NOA" address="0x00009888" value="0x043F0014" />
+        <register type="NOA" address="0x00009888" value="0x04588000" />
+        <register type="NOA" address="0x00009888" value="0x005A8000" />
+        <register type="NOA" address="0x00009888" value="0x025AC000" />
+        <register type="NOA" address="0x00009888" value="0x045A4000" />
+        <register type="NOA" address="0x00009888" value="0x0A5B4000" />
+        <register type="NOA" address="0x00009888" value="0x001D8000" />
+        <register type="NOA" address="0x00009888" value="0x021DC000" />
+        <register type="NOA" address="0x00009888" value="0x041D4000" />
+        <register type="NOA" address="0x00009888" value="0x0C1FA000" />
+        <register type="NOA" address="0x00009888" value="0x0E1F002A" />
+        <register type="NOA" address="0x00009888" value="0x0A384000" />
+        <register type="NOA" address="0x00009888" value="0x00394000" />
+        <register type="NOA" address="0x00009888" value="0x02395000" />
+        <register type="NOA" address="0x00009888" value="0x04399000" />
+        <register type="NOA" address="0x00009888" value="0x069B0034" />
+        <register type="NOA" address="0x00009888" value="0x109B0000" />
+        <register type="NOA" address="0x00009888" value="0x06DC4000" />
+        <register type="NOA" address="0x00009888" value="0x0CBD4000" />
+        <register type="NOA" address="0x00009888" value="0x0CBF0981" />
+        <register type="NOA" address="0x00009888" value="0x0EBF0A0F" />
+        <register type="NOA" address="0x00009888" value="0x06D84000" />
+        <register type="NOA" address="0x00009888" value="0x0CDAC000" />
+        <register type="NOA" address="0x00009888" value="0x0EDAC000" />
+        <register type="NOA" address="0x00009888" value="0x0CDB4000" />
+        <register type="NOA" address="0x00009888" value="0x0C9DC000" />
+        <register type="NOA" address="0x00009888" value="0x0E9DC000" />
+        <register type="NOA" address="0x00009888" value="0x109F02A8" />
+        <register type="NOA" address="0x00009888" value="0x0E9F0080" />
+        <register type="NOA" address="0x00009888" value="0x0CB84000" />
+        <register type="NOA" address="0x00009888" value="0x0CB95000" />
+        <register type="NOA" address="0x00009888" value="0x0EB95000" />
+        <register type="NOA" address="0x00009888" value="0x06B92000" />
+        <register type="NOA" address="0x00009888" value="0x0F88000F" />
+        <register type="NOA" address="0x00009888" value="0x0D880400" />
+        <register type="NOA" address="0x00009888" value="0x038A8000" />
+        <register type="NOA" address="0x00009888" value="0x058A8000" />
+        <register type="NOA" address="0x00009888" value="0x078A8000" />
+        <register type="NOA" address="0x00009888" value="0x098A8000" />
+        <register type="NOA" address="0x00009888" value="0x0B8A8000" />
+        <register type="NOA" address="0x00009888" value="0x258B8009" />
+        <register type="NOA" address="0x00009888" value="0x278B002A" />
+        <register type="NOA" address="0x00009888" value="0x238B2A80" />
+        <register type="NOA" address="0x00009888" value="0x198C4000" />
+        <register type="NOA" address="0x00009888" value="0x1B8C0015" />
+        <register type="NOA" address="0x00009888" value="0x0D8C4000" />
+        <register type="NOA" address="0x00009888" value="0x0D8DA000" />
+        <register type="NOA" address="0x00009888" value="0x0F8DA000" />
+        <register type="NOA" address="0x00009888" value="0x078D2000" />
+        <register type="NOA" address="0x00009888" value="0x2185800A" />
+        <register type="NOA" address="0x00009888" value="0x2385002A" />
+        <register type="NOA" address="0x00009888" value="0x1F85AA00" />
+        <register type="NOA" address="0x00009888" value="0x1B830154" />
+        <register type="NOA" address="0x00009888" value="0x03834000" />
+        <register type="NOA" address="0x00009888" value="0x05834000" />
+        <register type="NOA" address="0x00009888" value="0x07834000" />
+        <register type="NOA" address="0x00009888" value="0x09834000" />
+        <register type="NOA" address="0x00009888" value="0x0B834000" />
+        <register type="NOA" address="0x00009888" value="0x0D834000" />
+        <register type="NOA" address="0x00009888" value="0x0D84C000" />
+        <register type="NOA" address="0x00009888" value="0x0F84C000" />
+        <register type="NOA" address="0x00009888" value="0x01848000" />
+        <register type="NOA" address="0x00009888" value="0x0384C000" />
+        <register type="NOA" address="0x00009888" value="0x0584C000" />
+        <register type="NOA" address="0x00009888" value="0x07844000" />
+        <register type="NOA" address="0x00009888" value="0x1D80C000" />
+        <register type="NOA" address="0x00009888" value="0x1F80C000" />
+        <register type="NOA" address="0x00009888" value="0x11808000" />
+        <register type="NOA" address="0x00009888" value="0x1380C000" />
+        <register type="NOA" address="0x00009888" value="0x1580C000" />
+        <register type="NOA" address="0x00009888" value="0x17804000" />
+        <register type="NOA" address="0x00009888" value="0x53800000" />
+        <register type="NOA" address="0x00009888" value="0x45800C00" />
+        <register type="NOA" address="0x00009888" value="0x47800C63" />
+        <register type="NOA" address="0x00009888" value="0x21800000" />
+        <register type="NOA" address="0x00009888" value="0x31800000" />
+        <register type="NOA" address="0x00009888" value="0x4D800000" />
+        <register type="NOA" address="0x00009888" value="0x3F8014A5" />
+        <register type="NOA" address="0x00009888" value="0x4F800000" />
+        <register type="NOA" address="0x00009888" value="0x41800045" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x000091BC" value="0xE0500000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002744" value="0x00800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0xF0800000" />
+        <register type="OA" address="0x00002770" value="0x00100070" />
+        <register type="OA" address="0x00002774" value="0x0000FFF1" />
+        <register type="OA" address="0x00002778" value="0x00014002" />
+        <register type="OA" address="0x0000277C" value="0x0000C3FF" />
+        <register type="OA" address="0x00002780" value="0x00010002" />
+        <register type="OA" address="0x00002784" value="0x0000C7FF" />
+        <register type="OA" address="0x00002788" value="0x00004002" />
+        <register type="OA" address="0x0000278C" value="0x0000D3FF" />
+        <register type="OA" address="0x00002790" value="0x00100700" />
+        <register type="OA" address="0x00002794" value="0x0000FF1F" />
+        <register type="OA" address="0x00002798" value="0x00001402" />
+        <register type="OA" address="0x0000279C" value="0x0000FC3F" />
+        <register type="OA" address="0x000027A0" value="0x00001002" />
+        <register type="OA" address="0x000027A4" value="0x0000FC7F" />
+        <register type="OA" address="0x000027A8" value="0x00000402" />
+        <register type="OA" address="0x000027AC" value="0x0000FD3F" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E758" value="0x00015014" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+        <register type="FLEX" address="0x0000E65C" value="0x00055054" />
+    </register_config>
+  </set>
+
+  <set name="Metric set L3_4"
+       mdapi_supported_apis="VK OGL OCL IO BB"
+       underscore_name="l3_4"
+       hw_config_guid="be74c9d6-268f-4d7f-b2e8-8d91d4441883"
+       chipset="CHV"
+       symbol_name="L3_4"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SQ is full"
+             description="The percentage of time when SQ is filled above a threshold (usually 48 entries)"
+             data_type="float"
+             max_equation="100"
+             equation="PERFCNT1 READ_REG 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gt_request_queue_full"
+             units="percent"
+             symbol_name="GTRequestQueueFull"
+             availability="true $QueryMode &&"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL4 OCL"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on the both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 L3 Bank2 Stalled"
+             description="The percentage of time in which slice0 L3 bank2 is stalled"
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l30_bank2_stalled"
+             units="percent"
+             symbol_name="L30Bank2Stalled"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice1 L3 Bank2 Active"
+             description="The percentage of time in which slice1 L3 bank2 is active"
+             data_type="float"
+             max_equation="100"
+             equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l31_bank2_active"
+             units="percent"
+             symbol_name="L31Bank2Active"
+             availability="$SliceMask 0x2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Slice0 L3 Bank2 Active"
+             description="The percentage of time in which slice0 L3 bank2 is active"
+             data_type="float"
+             max_equation="100"
+             equation="C 6 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l30_bank2_active"
+             units="percent"
+             symbol_name="L30Bank2Active"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="Slice1 L3 Bank2 Stalled"
+             description="The percentage of time in which slice1 L3 bank2 is stalled"
+             data_type="float"
+             max_equation="100"
+             equation="B 4 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l31_bank2_stalled"
+             units="percent"
+             symbol_name="L31Bank2Stalled"
+             availability="$SliceMask 0x2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL 2 UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x000000A0" />
+        <register type="NOA" address="0x00009888" value="0x121A0340" />
+        <register type="NOA" address="0x00009888" value="0x103F0017" />
+        <register type="NOA" address="0x00009888" value="0x123F0020" />
+        <register type="NOA" address="0x00009888" value="0x129A0340" />
+        <register type="NOA" address="0x00009888" value="0x10BF0017" />
+        <register type="NOA" address="0x00009888" value="0x12BF0020" />
+        <register type="NOA" address="0x00009888" value="0x041A3400" />
+        <register type="NOA" address="0x00009888" value="0x101A0000" />
+        <register type="NOA" address="0x00009888" value="0x043B8000" />
+        <register type="NOA" address="0x00009888" value="0x0A3E0010" />
+        <register type="NOA" address="0x00009888" value="0x003F0200" />
+        <register type="NOA" address="0x00009888" value="0x023F0113" />
+        <register type="NOA" address="0x00009888" value="0x043F0014" />
+        <register type="NOA" address="0x00009888" value="0x02592000" />
+        <register type="NOA" address="0x00009888" value="0x005A8000" />
+        <register type="NOA" address="0x00009888" value="0x025AC000" />
+        <register type="NOA" address="0x00009888" value="0x045A4000" />
+        <register type="NOA" address="0x00009888" value="0x0A1C8000" />
+        <register type="NOA" address="0x00009888" value="0x001D8000" />
+        <register type="NOA" address="0x00009888" value="0x021DC000" />
+        <register type="NOA" address="0x00009888" value="0x041D4000" />
+        <register type="NOA" address="0x00009888" value="0x0A1E8000" />
+        <register type="NOA" address="0x00009888" value="0x0C1FA000" />
+        <register type="NOA" address="0x00009888" value="0x0E1F001A" />
+        <register type="NOA" address="0x00009888" value="0x00394000" />
+        <register type="NOA" address="0x00009888" value="0x02395000" />
+        <register type="NOA" address="0x00009888" value="0x04391000" />
+        <register type="NOA" address="0x00009888" value="0x069A0034" />
+        <register type="NOA" address="0x00009888" value="0x109A0000" />
+        <register type="NOA" address="0x00009888" value="0x06BB4000" />
+        <register type="NOA" address="0x00009888" value="0x0ABE0040" />
+        <register type="NOA" address="0x00009888" value="0x0CBF0984" />
+        <register type="NOA" address="0x00009888" value="0x0EBF0A02" />
+        <register type="NOA" address="0x00009888" value="0x02D94000" />
+        <register type="NOA" address="0x00009888" value="0x0CDAC000" />
+        <register type="NOA" address="0x00009888" value="0x0EDAC000" />
+        <register type="NOA" address="0x00009888" value="0x0C9C0400" />
+        <register type="NOA" address="0x00009888" value="0x0C9DC000" />
+        <register type="NOA" address="0x00009888" value="0x0E9DC000" />
+        <register type="NOA" address="0x00009888" value="0x0C9E0400" />
+        <register type="NOA" address="0x00009888" value="0x109F02A8" />
+        <register type="NOA" address="0x00009888" value="0x0E9F0040" />
+        <register type="NOA" address="0x00009888" value="0x0CB95000" />
+        <register type="NOA" address="0x00009888" value="0x0EB95000" />
+        <register type="NOA" address="0x00009888" value="0x0F88000F" />
+        <register type="NOA" address="0x00009888" value="0x0D880400" />
+        <register type="NOA" address="0x00009888" value="0x038A8000" />
+        <register type="NOA" address="0x00009888" value="0x058A8000" />
+        <register type="NOA" address="0x00009888" value="0x078A8000" />
+        <register type="NOA" address="0x00009888" value="0x098A8000" />
+        <register type="NOA" address="0x00009888" value="0x0B8A8000" />
+        <register type="NOA" address="0x00009888" value="0x258B8009" />
+        <register type="NOA" address="0x00009888" value="0x278B002A" />
+        <register type="NOA" address="0x00009888" value="0x238B2A80" />
+        <register type="NOA" address="0x00009888" value="0x198C4000" />
+        <register type="NOA" address="0x00009888" value="0x1B8C0015" />
+        <register type="NOA" address="0x00009888" value="0x0D8C4000" />
+        <register type="NOA" address="0x00009888" value="0x0D8DA000" />
+        <register type="NOA" address="0x00009888" value="0x0F8DA000" />
+        <register type="NOA" address="0x00009888" value="0x078D2000" />
+        <register type="NOA" address="0x00009888" value="0x2185800A" />
+        <register type="NOA" address="0x00009888" value="0x2385002A" />
+        <register type="NOA" address="0x00009888" value="0x1F85AA00" />
+        <register type="NOA" address="0x00009888" value="0x1B830154" />
+        <register type="NOA" address="0x00009888" value="0x03834000" />
+        <register type="NOA" address="0x00009888" value="0x05834000" />
+        <register type="NOA" address="0x00009888" value="0x07834000" />
+        <register type="NOA" address="0x00009888" value="0x09834000" />
+        <register type="NOA" address="0x00009888" value="0x0B834000" />
+        <register type="NOA" address="0x00009888" value="0x0D834000" />
+        <register type="NOA" address="0x00009888" value="0x0D84C000" />
+        <register type="NOA" address="0x00009888" value="0x0F84C000" />
+        <register type="NOA" address="0x00009888" value="0x01848000" />
+        <register type="NOA" address="0x00009888" value="0x0384C000" />
+        <register type="NOA" address="0x00009888" value="0x0584C000" />
+        <register type="NOA" address="0x00009888" value="0x07844000" />
+        <register type="NOA" address="0x00009888" value="0x1D80C000" />
+        <register type="NOA" address="0x00009888" value="0x1F80C000" />
+        <register type="NOA" address="0x00009888" value="0x11808000" />
+        <register type="NOA" address="0x00009888" value="0x1380C000" />
+        <register type="NOA" address="0x00009888" value="0x1580C000" />
+        <register type="NOA" address="0x00009888" value="0x17804000" />
+        <register type="NOA" address="0x00009888" value="0x53800000" />
+        <register type="NOA" address="0x00009888" value="0x45800800" />
+        <register type="NOA" address="0x00009888" value="0x47800842" />
+        <register type="NOA" address="0x00009888" value="0x21800000" />
+        <register type="NOA" address="0x00009888" value="0x31800000" />
+        <register type="NOA" address="0x00009888" value="0x4D800000" />
+        <register type="NOA" address="0x00009888" value="0x3F801084" />
+        <register type="NOA" address="0x00009888" value="0x4F800000" />
+        <register type="NOA" address="0x00009888" value="0x41800044" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x000091BC" value="0xE0500000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002744" value="0x00800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0xF0800000" />
+        <register type="OA" address="0x00002770" value="0x00100070" />
+        <register type="OA" address="0x00002774" value="0x0000FFF1" />
+        <register type="OA" address="0x00002778" value="0x00014002" />
+        <register type="OA" address="0x0000277C" value="0x0000C3FF" />
+        <register type="OA" address="0x00002780" value="0x00010002" />
+        <register type="OA" address="0x00002784" value="0x0000C7FF" />
+        <register type="OA" address="0x00002788" value="0x00004002" />
+        <register type="OA" address="0x0000278C" value="0x0000D3FF" />
+        <register type="OA" address="0x00002790" value="0x00100700" />
+        <register type="OA" address="0x00002794" value="0x0000FF1F" />
+        <register type="OA" address="0x00002798" value="0x00001402" />
+        <register type="OA" address="0x0000279C" value="0x0000FC3F" />
+        <register type="OA" address="0x000027A0" value="0x00001002" />
+        <register type="OA" address="0x000027A4" value="0x0000FC7F" />
+        <register type="OA" address="0x000027A8" value="0x00000402" />
+        <register type="OA" address="0x000027AC" value="0x0000FD3F" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E758" value="0x00015014" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+        <register type="FLEX" address="0x0000E65C" value="0x00055054" />
+    </register_config>
+  </set>
+
+  <set name="Metric set RasterizerAndPixelBackend"
+       mdapi_supported_apis="VK OGL OCL IO BB"
+       underscore_name="rasterizer_and_pixel_backend"
+       hw_config_guid="31bc1ff3-8d09-4497-9d79-59c4f943b502"
+       chipset="CHV"
+       symbol_name="RasterizerAndPixelBackend"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice1 Rasterizer Input Available"
+             description="The percentage of time in which slice1 rasterizer input is available"
+             data_type="float"
+             max_equation="100"
+             equation="B 3 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="rasterizer1_input_available"
+             units="percent"
+             symbol_name="Rasterizer1InputAvailable"
+             availability="$SliceMask 0x2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Rasterizer"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Slice0 Pixel Values Ready"
+             description="The percentage of time in which slice0 pixel values are ready"
+             data_type="float"
+             max_equation="100"
+             equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="pixel_values0_ready"
+             units="percent"
+             symbol_name="PixelValues0Ready"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/3D Pipe"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texel lookups (with 2x2 accuracy) that missed the L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="Slice0 Rasterizer Input Available"
+             description="The percentage of time in which slice0 rasterizer input is available"
+             data_type="float"
+             max_equation="100"
+             equation="B 5 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="rasterizer0_input_available"
+             units="percent"
+             symbol_name="Rasterizer0InputAvailable"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Rasterizer"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Slice0 Post-EarlyZ Pixel Data Ready"
+             description="The percentage of time in which slice0 post-EarlyZ pixel data is ready (after early Z tests have been applied)"
+             data_type="float"
+             max_equation="100"
+             equation="B 2 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="pixel_data0_ready"
+             units="percent"
+             symbol_name="PixelData0Ready"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Rasterizer/Early Depth Test"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice1 Pixel Values Ready"
+             description="The percentage of time in which slice1 pixel values are ready"
+             data_type="float"
+             max_equation="100"
+             equation="C 5 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="pixel_values1_ready"
+             units="percent"
+             symbol_name="PixelValues1Ready"
+             availability="$SliceMask 0x2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="GPU/3D Pipe"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Slice1 PS Output Available"
+             description="The percentage of time in which slice1 PS output is available"
+             data_type="float"
+             max_equation="100"
+             equation="C 4 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_output1_available"
+             units="percent"
+             symbol_name="PSOutput1Available"
+             availability="$SliceMask 0x2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/3D Pipe"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 Rasterizer Output Ready"
+             description="The percentage of time in which slice0 rasterizer output is ready"
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="rasterizer0_output_ready"
+             units="percent"
+             symbol_name="Rasterizer0OutputReady"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Rasterizer"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Slice1 Rasterizer Output Ready"
+             description="The percentage of time in which slice1 rasterizer output is ready"
+             data_type="float"
+             max_equation="100"
+             equation="B 4 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="rasterizer1_output_ready"
+             units="percent"
+             symbol_name="Rasterizer1OutputReady"
+             availability="$SliceMask 0x2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Rasterizer"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Slice1 Post-EarlyZ Pixel Data Ready"
+             description="The percentage of time in which slice1 post-EarlyZ pixel data is ready (after early Z tests have been applied)"
+             data_type="float"
+             max_equation="100"
+             equation="B 1 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="pixel_data1_ready"
+             units="percent"
+             symbol_name="PixelData1Ready"
+             availability="$SliceMask 0x2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Rasterizer/Early Depth Test"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="SQ is full"
+             description="The percentage of time when SQ is filled above a threshold (usually 48 entries)"
+             data_type="float"
+             max_equation="100"
+             equation="PERFCNT1 READ_REG 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gt_request_queue_full"
+             units="percent"
+             symbol_name="GTRequestQueueFull"
+             availability="true $QueryMode &amp;&amp;"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL4 OCL"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL 2 UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="Slice0 PS Output Available"
+             description="The percentage of time in which slice0 PS output is available"
+             data_type="float"
+             max_equation="100"
+             equation="C 6 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_output0_available"
+             units="percent"
+             symbol_name="PSOutput0Available"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/3D Pipe"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x000000A0" />
+        <register type="NOA" address="0x00009888" value="0x143B000E" />
+        <register type="NOA" address="0x00009888" value="0x043C55C0" />
+        <register type="NOA" address="0x00009888" value="0x0A1E0280" />
+        <register type="NOA" address="0x00009888" value="0x0C1E0408" />
+        <register type="NOA" address="0x00009888" value="0x10390000" />
+        <register type="NOA" address="0x00009888" value="0x12397A1F" />
+        <register type="NOA" address="0x00009888" value="0x14BB000E" />
+        <register type="NOA" address="0x00009888" value="0x04BC5000" />
+        <register type="NOA" address="0x00009888" value="0x0A9E0296" />
+        <register type="NOA" address="0x00009888" value="0x0C9E0008" />
+        <register type="NOA" address="0x00009888" value="0x10B90000" />
+        <register type="NOA" address="0x00009888" value="0x12B97A1F" />
+        <register type="NOA" address="0x00009888" value="0x063B0042" />
+        <register type="NOA" address="0x00009888" value="0x103B0000" />
+        <register type="NOA" address="0x00009888" value="0x083C0000" />
+        <register type="NOA" address="0x00009888" value="0x0A3E0040" />
+        <register type="NOA" address="0x00009888" value="0x043F8000" />
+        <register type="NOA" address="0x00009888" value="0x02594000" />
+        <register type="NOA" address="0x00009888" value="0x045A8000" />
+        <register type="NOA" address="0x00009888" value="0x0C1C0400" />
+        <register type="NOA" address="0x00009888" value="0x041D8000" />
+        <register type="NOA" address="0x00009888" value="0x081E02C0" />
+        <register type="NOA" address="0x00009888" value="0x0E1E0000" />
+        <register type="NOA" address="0x00009888" value="0x0C1FA800" />
+        <register type="NOA" address="0x00009888" value="0x0E1F0260" />
+        <register type="NOA" address="0x00009888" value="0x101F0014" />
+        <register type="NOA" address="0x00009888" value="0x003905E0" />
+        <register type="NOA" address="0x00009888" value="0x06390BC0" />
+        <register type="NOA" address="0x00009888" value="0x02390018" />
+        <register type="NOA" address="0x00009888" value="0x04394000" />
+        <register type="NOA" address="0x00009888" value="0x04BB0042" />
+        <register type="NOA" address="0x00009888" value="0x10BB0000" />
+        <register type="NOA" address="0x00009888" value="0x02BC05C0" />
+        <register type="NOA" address="0x00009888" value="0x08BC0000" />
+        <register type="NOA" address="0x00009888" value="0x0ABE0004" />
+        <register type="NOA" address="0x00009888" value="0x02BF8000" />
+        <register type="NOA" address="0x00009888" value="0x02D91000" />
+        <register type="NOA" address="0x00009888" value="0x02DA8000" />
+        <register type="NOA" address="0x00009888" value="0x089C8000" />
+        <register type="NOA" address="0x00009888" value="0x029D8000" />
+        <register type="NOA" address="0x00009888" value="0x089E8000" />
+        <register type="NOA" address="0x00009888" value="0x0E9E0000" />
+        <register type="NOA" address="0x00009888" value="0x0E9FA806" />
+        <register type="NOA" address="0x00009888" value="0x109F0142" />
+        <register type="NOA" address="0x00009888" value="0x08B90617" />
+        <register type="NOA" address="0x00009888" value="0x0AB90BE0" />
+        <register type="NOA" address="0x00009888" value="0x02B94000" />
+        <register type="NOA" address="0x00009888" value="0x0D88F000" />
+        <register type="NOA" address="0x00009888" value="0x0F88000C" />
+        <register type="NOA" address="0x00009888" value="0x07888000" />
+        <register type="NOA" address="0x00009888" value="0x09888000" />
+        <register type="NOA" address="0x00009888" value="0x018A8000" />
+        <register type="NOA" address="0x00009888" value="0x0F8A8000" />
+        <register type="NOA" address="0x00009888" value="0x1B8A2800" />
+        <register type="NOA" address="0x00009888" value="0x038A8000" />
+        <register type="NOA" address="0x00009888" value="0x058A8000" />
+        <register type="NOA" address="0x00009888" value="0x0B8A8000" />
+        <register type="NOA" address="0x00009888" value="0x0D8A8000" />
+        <register type="NOA" address="0x00009888" value="0x238B52A0" />
+        <register type="NOA" address="0x00009888" value="0x258B6A95" />
+        <register type="NOA" address="0x00009888" value="0x278B0029" />
+        <register type="NOA" address="0x00009888" value="0x178C2000" />
+        <register type="NOA" address="0x00009888" value="0x198C1500" />
+        <register type="NOA" address="0x00009888" value="0x1B8C0014" />
+        <register type="NOA" address="0x00009888" value="0x078C4000" />
+        <register type="NOA" address="0x00009888" value="0x098C4000" />
+        <register type="NOA" address="0x00009888" value="0x098DA000" />
+        <register type="NOA" address="0x00009888" value="0x0B8DA000" />
+        <register type="NOA" address="0x00009888" value="0x0F8DA000" />
+        <register type="NOA" address="0x00009888" value="0x038D8000" />
+        <register type="NOA" address="0x00009888" value="0x058D2000" />
+        <register type="NOA" address="0x00009888" value="0x1F85AA80" />
+        <register type="NOA" address="0x00009888" value="0x2185AAAA" />
+        <register type="NOA" address="0x00009888" value="0x2385002A" />
+        <register type="NOA" address="0x00009888" value="0x01834000" />
+        <register type="NOA" address="0x00009888" value="0x0F834000" />
+        <register type="NOA" address="0x00009888" value="0x19835400" />
+        <register type="NOA" address="0x00009888" value="0x1B830155" />
+        <register type="NOA" address="0x00009888" value="0x03834000" />
+        <register type="NOA" address="0x00009888" value="0x05834000" />
+        <register type="NOA" address="0x00009888" value="0x07834000" />
+        <register type="NOA" address="0x00009888" value="0x09834000" />
+        <register type="NOA" address="0x00009888" value="0x0B834000" />
+        <register type="NOA" address="0x00009888" value="0x0D834000" />
+        <register type="NOA" address="0x00009888" value="0x0184C000" />
+        <register type="NOA" address="0x00009888" value="0x0784C000" />
+        <register type="NOA" address="0x00009888" value="0x0984C000" />
+        <register type="NOA" address="0x00009888" value="0x0B84C000" />
+        <register type="NOA" address="0x00009888" value="0x0D84C000" />
+        <register type="NOA" address="0x00009888" value="0x0F84C000" />
+        <register type="NOA" address="0x00009888" value="0x0384C000" />
+        <register type="NOA" address="0x00009888" value="0x0584C000" />
+        <register type="NOA" address="0x00009888" value="0x1180C000" />
+        <register type="NOA" address="0x00009888" value="0x1780C000" />
+        <register type="NOA" address="0x00009888" value="0x1980C000" />
+        <register type="NOA" address="0x00009888" value="0x1B80C000" />
+        <register type="NOA" address="0x00009888" value="0x1D80C000" />
+        <register type="NOA" address="0x00009888" value="0x1F80C000" />
+        <register type="NOA" address="0x00009888" value="0x1380C000" />
+        <register type="NOA" address="0x00009888" value="0x1580C000" />
+        <register type="NOA" address="0x00009888" value="0x4D800444" />
+        <register type="NOA" address="0x00009888" value="0x3D800000" />
+        <register type="NOA" address="0x00009888" value="0x4F804000" />
+        <register type="NOA" address="0x00009888" value="0x43801080" />
+        <register type="NOA" address="0x00009888" value="0x51800000" />
+        <register type="NOA" address="0x00009888" value="0x45800084" />
+        <register type="NOA" address="0x00009888" value="0x53800044" />
+        <register type="NOA" address="0x00009888" value="0x47801080" />
+        <register type="NOA" address="0x00009888" value="0x21800000" />
+        <register type="NOA" address="0x00009888" value="0x31800000" />
+        <register type="NOA" address="0x00009888" value="0x3F800000" />
+        <register type="NOA" address="0x00009888" value="0x41800840" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x000091BC" value="0xE0500000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002744" value="0x00800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x30800000" />
+        <register type="OA" address="0x00002770" value="0x00006000" />
+        <register type="OA" address="0x00002774" value="0x0000F3FF" />
+        <register type="OA" address="0x00002778" value="0x00001800" />
+        <register type="OA" address="0x0000277C" value="0x0000FCFF" />
+        <register type="OA" address="0x00002780" value="0x00000600" />
+        <register type="OA" address="0x00002784" value="0x0000FF3F" />
+        <register type="OA" address="0x00002788" value="0x00000180" />
+        <register type="OA" address="0x0000278C" value="0x0000FFCF" />
+        <register type="OA" address="0x00002790" value="0x00000060" />
+        <register type="OA" address="0x00002794" value="0x0000FFF3" />
+        <register type="OA" address="0x00002798" value="0x00000018" />
+        <register type="OA" address="0x0000279C" value="0x0000FFFC" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E758" value="0x00015014" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+        <register type="FLEX" address="0x0000E65C" value="0x00055054" />
+    </register_config>
+  </set>
+
+  <set name="Metric set Sampler_1"
+       mdapi_supported_apis="VK OGL OCL IO BB"
+       underscore_name="sampler_1"
+       hw_config_guid="05450fec-bb5c-4b0a-8995-e03631168a34"
+       chipset="CHV"
+       symbol_name="Sampler_1"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SQ is full"
+             description="The percentage of time when SQ is filled above a threshold (usually 48 entries)"
+             data_type="float"
+             max_equation="100"
+             equation="PERFCNT1 READ_REG 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gt_request_queue_full"
+             units="percent"
+             symbol_name="GTRequestQueueFull"
+             availability="true $QueryMode &amp;&amp;"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL4 OCL"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Slice1 Subslice0 Input Available"
+             description="The percentage of time in which slice1 subslice0 sampler input is available"
+             data_type="float"
+             max_equation="100"
+             equation="B 2 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler10_input_available"
+             units="percent"
+             symbol_name="Sampler10InputAvailable"
+             availability="$SubsliceMask 0x8 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Slice1 Subslice2 Sampler Output Ready"
+             description="The percentage of time in which slice1 subslice2 sampler output is ready"
+             data_type="float"
+             max_equation="100"
+             equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler12_output_ready"
+             units="percent"
+             symbol_name="Sampler12OutputReady"
+             availability="$SubsliceMask 0x20 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice1 Subslice1 Input Available"
+             description="The percentage of time in which slice1 subslice1 sampler input is available"
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler11_input_available"
+             units="percent"
+             symbol_name="Sampler11InputAvailable"
+             availability="$SubsliceMask 0x10 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Slice1 Subslice2 Input Available"
+             description="The percentage of time in which slice1 subslice2 sampler input is available"
+             data_type="float"
+             max_equation="100"
+             equation="B 1 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler12_input_available"
+             units="percent"
+             symbol_name="Sampler12InputAvailable"
+             availability="$SubsliceMask 0x20 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Slice1 Subslice0 Sampler Output Ready"
+             description="The percentage of time in which slice1 subslice0 sampler output is ready"
+             data_type="float"
+             max_equation="100"
+             equation="C 6 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler10_output_ready"
+             units="percent"
+             symbol_name="Sampler10OutputReady"
+             availability="$SubsliceMask 0x8 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="Slice1 Subslice1 Sampler Output Ready"
+             description="The percentage of time in which slice1 subslice1 sampler output is ready"
+             data_type="float"
+             max_equation="100"
+             equation="C 5 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler11_output_ready"
+             units="percent"
+             symbol_name="Sampler11OutputReady"
+             availability="$SubsliceMask 0x10 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL 2 UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x000000A0" />
+        <register type="NOA" address="0x00009888" value="0x18921400" />
+        <register type="NOA" address="0x00009888" value="0x149500AB" />
+        <register type="NOA" address="0x00009888" value="0x18B21400" />
+        <register type="NOA" address="0x00009888" value="0x14B500AB" />
+        <register type="NOA" address="0x00009888" value="0x18D21400" />
+        <register type="NOA" address="0x00009888" value="0x14D500AB" />
+        <register type="NOA" address="0x00009888" value="0x0CDC8000" />
+        <register type="NOA" address="0x00009888" value="0x0EDC4000" />
+        <register type="NOA" address="0x00009888" value="0x02DCC000" />
+        <register type="NOA" address="0x00009888" value="0x04DCC000" />
+        <register type="NOA" address="0x00009888" value="0x1ABD00A0" />
+        <register type="NOA" address="0x00009888" value="0x0ABD8000" />
+        <register type="NOA" address="0x00009888" value="0x0CD88000" />
+        <register type="NOA" address="0x00009888" value="0x0ED84000" />
+        <register type="NOA" address="0x00009888" value="0x04D88000" />
+        <register type="NOA" address="0x00009888" value="0x1ADB0050" />
+        <register type="NOA" address="0x00009888" value="0x04DB8000" />
+        <register type="NOA" address="0x00009888" value="0x06DB8000" />
+        <register type="NOA" address="0x00009888" value="0x08DB8000" />
+        <register type="NOA" address="0x00009888" value="0x0ADB4000" />
+        <register type="NOA" address="0x00009888" value="0x109F02A0" />
+        <register type="NOA" address="0x00009888" value="0x0C9FA000" />
+        <register type="NOA" address="0x00009888" value="0x0E9F00AA" />
+        <register type="NOA" address="0x00009888" value="0x18B82500" />
+        <register type="NOA" address="0x00009888" value="0x02B88000" />
+        <register type="NOA" address="0x00009888" value="0x04B84000" />
+        <register type="NOA" address="0x00009888" value="0x06B84000" />
+        <register type="NOA" address="0x00009888" value="0x08B84000" />
+        <register type="NOA" address="0x00009888" value="0x0AB84000" />
+        <register type="NOA" address="0x00009888" value="0x0CB88000" />
+        <register type="NOA" address="0x00009888" value="0x0CB98000" />
+        <register type="NOA" address="0x00009888" value="0x0EB9A000" />
+        <register type="NOA" address="0x00009888" value="0x00B98000" />
+        <register type="NOA" address="0x00009888" value="0x02B9A000" />
+        <register type="NOA" address="0x00009888" value="0x04B9A000" />
+        <register type="NOA" address="0x00009888" value="0x06B92000" />
+        <register type="NOA" address="0x00009888" value="0x1ABA0200" />
+        <register type="NOA" address="0x00009888" value="0x02BA8000" />
+        <register type="NOA" address="0x00009888" value="0x0CBA8000" />
+        <register type="NOA" address="0x00009888" value="0x04908000" />
+        <register type="NOA" address="0x00009888" value="0x04918000" />
+        <register type="NOA" address="0x00009888" value="0x04927300" />
+        <register type="NOA" address="0x00009888" value="0x10920000" />
+        <register type="NOA" address="0x00009888" value="0x1893000A" />
+        <register type="NOA" address="0x00009888" value="0x0A934000" />
+        <register type="NOA" address="0x00009888" value="0x0A946000" />
+        <register type="NOA" address="0x00009888" value="0x0C959000" />
+        <register type="NOA" address="0x00009888" value="0x0E950098" />
+        <register type="NOA" address="0x00009888" value="0x10950000" />
+        <register type="NOA" address="0x00009888" value="0x04B04000" />
+        <register type="NOA" address="0x00009888" value="0x04B14000" />
+        <register type="NOA" address="0x00009888" value="0x04B20073" />
+        <register type="NOA" address="0x00009888" value="0x10B20000" />
+        <register type="NOA" address="0x00009888" value="0x04B38000" />
+        <register type="NOA" address="0x00009888" value="0x06B38000" />
+        <register type="NOA" address="0x00009888" value="0x08B34000" />
+        <register type="NOA" address="0x00009888" value="0x04B4C000" />
+        <register type="NOA" address="0x00009888" value="0x02B59890" />
+        <register type="NOA" address="0x00009888" value="0x10B50000" />
+        <register type="NOA" address="0x00009888" value="0x06D04000" />
+        <register type="NOA" address="0x00009888" value="0x06D14000" />
+        <register type="NOA" address="0x00009888" value="0x06D20073" />
+        <register type="NOA" address="0x00009888" value="0x10D20000" />
+        <register type="NOA" address="0x00009888" value="0x18D30020" />
+        <register type="NOA" address="0x00009888" value="0x02D38000" />
+        <register type="NOA" address="0x00009888" value="0x0CD34000" />
+        <register type="NOA" address="0x00009888" value="0x0AD48000" />
+        <register type="NOA" address="0x00009888" value="0x04D42000" />
+        <register type="NOA" address="0x00009888" value="0x0ED59000" />
+        <register type="NOA" address="0x00009888" value="0x00D59800" />
+        <register type="NOA" address="0x00009888" value="0x10D50000" />
+        <register type="NOA" address="0x00009888" value="0x0F88000E" />
+        <register type="NOA" address="0x00009888" value="0x03888000" />
+        <register type="NOA" address="0x00009888" value="0x05888000" />
+        <register type="NOA" address="0x00009888" value="0x07888000" />
+        <register type="NOA" address="0x00009888" value="0x09888000" />
+        <register type="NOA" address="0x00009888" value="0x0B888000" />
+        <register type="NOA" address="0x00009888" value="0x0D880400" />
+        <register type="NOA" address="0x00009888" value="0x278B002A" />
+        <register type="NOA" address="0x00009888" value="0x238B5500" />
+        <register type="NOA" address="0x00009888" value="0x258B000A" />
+        <register type="NOA" address="0x00009888" value="0x1B8C0015" />
+        <register type="NOA" address="0x00009888" value="0x038C4000" />
+        <register type="NOA" address="0x00009888" value="0x058C4000" />
+        <register type="NOA" address="0x00009888" value="0x078C4000" />
+        <register type="NOA" address="0x00009888" value="0x098C4000" />
+        <register type="NOA" address="0x00009888" value="0x0B8C4000" />
+        <register type="NOA" address="0x00009888" value="0x0D8C4000" />
+        <register type="NOA" address="0x00009888" value="0x0D8D8000" />
+        <register type="NOA" address="0x00009888" value="0x0F8DA000" />
+        <register type="NOA" address="0x00009888" value="0x018D8000" />
+        <register type="NOA" address="0x00009888" value="0x038DA000" />
+        <register type="NOA" address="0x00009888" value="0x058DA000" />
+        <register type="NOA" address="0x00009888" value="0x078D2000" />
+        <register type="NOA" address="0x00009888" value="0x2385002A" />
+        <register type="NOA" address="0x00009888" value="0x1F85AA00" />
+        <register type="NOA" address="0x00009888" value="0x2185000A" />
+        <register type="NOA" address="0x00009888" value="0x1B830150" />
+        <register type="NOA" address="0x00009888" value="0x03834000" />
+        <register type="NOA" address="0x00009888" value="0x05834000" />
+        <register type="NOA" address="0x00009888" value="0x07834000" />
+        <register type="NOA" address="0x00009888" value="0x09834000" />
+        <register type="NOA" address="0x00009888" value="0x0B834000" />
+        <register type="NOA" address="0x00009888" value="0x0D834000" />
+        <register type="NOA" address="0x00009888" value="0x0D848000" />
+        <register type="NOA" address="0x00009888" value="0x0F84C000" />
+        <register type="NOA" address="0x00009888" value="0x01848000" />
+        <register type="NOA" address="0x00009888" value="0x0384C000" />
+        <register type="NOA" address="0x00009888" value="0x0584C000" />
+        <register type="NOA" address="0x00009888" value="0x07844000" />
+        <register type="NOA" address="0x00009888" value="0x1D808000" />
+        <register type="NOA" address="0x00009888" value="0x1F80C000" />
+        <register type="NOA" address="0x00009888" value="0x11808000" />
+        <register type="NOA" address="0x00009888" value="0x1380C000" />
+        <register type="NOA" address="0x00009888" value="0x1580C000" />
+        <register type="NOA" address="0x00009888" value="0x17804000" />
+        <register type="NOA" address="0x00009888" value="0x53800000" />
+        <register type="NOA" address="0x00009888" value="0x47801021" />
+        <register type="NOA" address="0x00009888" value="0x21800000" />
+        <register type="NOA" address="0x00009888" value="0x31800000" />
+        <register type="NOA" address="0x00009888" value="0x4D800000" />
+        <register type="NOA" address="0x00009888" value="0x3F800C64" />
+        <register type="NOA" address="0x00009888" value="0x4F800000" />
+        <register type="NOA" address="0x00009888" value="0x41800C02" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x000091BC" value="0xE0500000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002744" value="0x00800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x70800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+        <register type="OA" address="0x00002770" value="0x0000C000" />
+        <register type="OA" address="0x00002774" value="0x0000E7FF" />
+        <register type="OA" address="0x00002778" value="0x00003000" />
+        <register type="OA" address="0x0000277C" value="0x0000F9FF" />
+        <register type="OA" address="0x00002780" value="0x00000C00" />
+        <register type="OA" address="0x00002784" value="0x0000FE7F" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E758" value="0x00015014" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+        <register type="FLEX" address="0x0000E65C" value="0x00055054" />
+    </register_config>
+  </set>
+
+  <set name="Metric set Sampler_2"
+       mdapi_supported_apis="VK OGL OCL IO BB"
+       underscore_name="sampler_2"
+       hw_config_guid="883c8a56-8767-4de8-beec-a99462c6674b"
+       chipset="CHV"
+       symbol_name="Sampler_2"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 Subslice2 Input Available"
+             description="The percentage of time in which slice0 subslice2 sampler input is available"
+             data_type="float"
+             max_equation="100"
+             equation="B 1 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler02_input_available"
+             units="percent"
+             symbol_name="Sampler02InputAvailable"
+             availability="$SubsliceMask 0x4 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SQ is full"
+             description="The percentage of time when SQ is filled above a threshold (usually 48 entries)"
+             data_type="float"
+             max_equation="100"
+             equation="PERFCNT1 READ_REG 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gt_request_queue_full"
+             units="percent"
+             symbol_name="GTRequestQueueFull"
+             availability="true $QueryMode &&"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL4 OCL"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 Subslice0 Input Available"
+             description="The percentage of time in which slice0 subslice0 sampler input is available"
+             data_type="float"
+             max_equation="100"
+             equation="B 2 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler00_input_available"
+             units="percent"
+             symbol_name="Sampler00InputAvailable"
+             availability="$SubsliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="Slice0 Subslice2 Sampler Output Ready"
+             description="The percentage of time in which slice0 subslice2 sampler output is ready"
+             data_type="float"
+             max_equation="100"
+             equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler02_output_ready"
+             units="percent"
+             symbol_name="Sampler02OutputReady"
+             availability="$SubsliceMask 0x4 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Slice0 Subslice1 Input Available"
+             description="The percentage of time in which slice0 subslice1 sampler input is available"
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler01_input_available"
+             units="percent"
+             symbol_name="Sampler01InputAvailable"
+             availability="$SubsliceMask 0x2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texel lookups (with 2x2 accuracy) that missed the L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Slice0 Subslice0 Sampler Output Ready"
+             description="The percentage of time in which slice0 subslice0 sampler output is ready"
+             data_type="float"
+             max_equation="100"
+             equation="C 6 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler00_output_ready"
+             units="percent"
+             symbol_name="Sampler00OutputReady"
+             availability="$SubsliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Slice0 Subslice1 Sampler Output Ready"
+             description="The percentage of time in which slice0 subslice1 sampler output is ready"
+             data_type="float"
+             max_equation="100"
+             equation="C 5 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler01_output_ready"
+             units="percent"
+             symbol_name="Sampler01OutputReady"
+             availability="$SubsliceMask 0x2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL 2 UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x000000A0" />
+        <register type="NOA" address="0x00009888" value="0x18121400" />
+        <register type="NOA" address="0x00009888" value="0x141500AB" />
+        <register type="NOA" address="0x00009888" value="0x18321400" />
+        <register type="NOA" address="0x00009888" value="0x143500AB" />
+        <register type="NOA" address="0x00009888" value="0x18521400" />
+        <register type="NOA" address="0x00009888" value="0x145500AB" />
+        <register type="NOA" address="0x00009888" value="0x0C5C8000" />
+        <register type="NOA" address="0x00009888" value="0x0E5C4000" />
+        <register type="NOA" address="0x00009888" value="0x025CC000" />
+        <register type="NOA" address="0x00009888" value="0x045CC000" />
+        <register type="NOA" address="0x00009888" value="0x1A3D00A0" />
+        <register type="NOA" address="0x00009888" value="0x0A3D8000" />
+        <register type="NOA" address="0x00009888" value="0x0C588000" />
+        <register type="NOA" address="0x00009888" value="0x0E584000" />
+        <register type="NOA" address="0x00009888" value="0x04588000" />
+        <register type="NOA" address="0x00009888" value="0x1A5B0050" />
+        <register type="NOA" address="0x00009888" value="0x045B8000" />
+        <register type="NOA" address="0x00009888" value="0x065B8000" />
+        <register type="NOA" address="0x00009888" value="0x085B8000" />
+        <register type="NOA" address="0x00009888" value="0x0A5B4000" />
+        <register type="NOA" address="0x00009888" value="0x101F02A0" />
+        <register type="NOA" address="0x00009888" value="0x0C1FA000" />
+        <register type="NOA" address="0x00009888" value="0x0E1F00AA" />
+        <register type="NOA" address="0x00009888" value="0x18382500" />
+        <register type="NOA" address="0x00009888" value="0x02388000" />
+        <register type="NOA" address="0x00009888" value="0x04384000" />
+        <register type="NOA" address="0x00009888" value="0x06384000" />
+        <register type="NOA" address="0x00009888" value="0x08384000" />
+        <register type="NOA" address="0x00009888" value="0x0A384000" />
+        <register type="NOA" address="0x00009888" value="0x0C388000" />
+        <register type="NOA" address="0x00009888" value="0x0C398000" />
+        <register type="NOA" address="0x00009888" value="0x0E39A000" />
+        <register type="NOA" address="0x00009888" value="0x00398000" />
+        <register type="NOA" address="0x00009888" value="0x0239A000" />
+        <register type="NOA" address="0x00009888" value="0x0439A000" />
+        <register type="NOA" address="0x00009888" value="0x06392000" />
+        <register type="NOA" address="0x00009888" value="0x1A3A0200" />
+        <register type="NOA" address="0x00009888" value="0x023A8000" />
+        <register type="NOA" address="0x00009888" value="0x0C3A8000" />
+        <register type="NOA" address="0x00009888" value="0x04108000" />
+        <register type="NOA" address="0x00009888" value="0x04118000" />
+        <register type="NOA" address="0x00009888" value="0x04127300" />
+        <register type="NOA" address="0x00009888" value="0x10120000" />
+        <register type="NOA" address="0x00009888" value="0x1813000A" />
+        <register type="NOA" address="0x00009888" value="0x0A134000" />
+        <register type="NOA" address="0x00009888" value="0x0A146000" />
+        <register type="NOA" address="0x00009888" value="0x0C159000" />
+        <register type="NOA" address="0x00009888" value="0x0E150098" />
+        <register type="NOA" address="0x00009888" value="0x10150000" />
+        <register type="NOA" address="0x00009888" value="0x04304000" />
+        <register type="NOA" address="0x00009888" value="0x04314000" />
+        <register type="NOA" address="0x00009888" value="0x04320073" />
+        <register type="NOA" address="0x00009888" value="0x10320000" />
+        <register type="NOA" address="0x00009888" value="0x04338000" />
+        <register type="NOA" address="0x00009888" value="0x06338000" />
+        <register type="NOA" address="0x00009888" value="0x08334000" />
+        <register type="NOA" address="0x00009888" value="0x0434C000" />
+        <register type="NOA" address="0x00009888" value="0x02359890" />
+        <register type="NOA" address="0x00009888" value="0x10350000" />
+        <register type="NOA" address="0x00009888" value="0x06504000" />
+        <register type="NOA" address="0x00009888" value="0x06514000" />
+        <register type="NOA" address="0x00009888" value="0x06520073" />
+        <register type="NOA" address="0x00009888" value="0x10520000" />
+        <register type="NOA" address="0x00009888" value="0x18530020" />
+        <register type="NOA" address="0x00009888" value="0x02538000" />
+        <register type="NOA" address="0x00009888" value="0x0C534000" />
+        <register type="NOA" address="0x00009888" value="0x0A548000" />
+        <register type="NOA" address="0x00009888" value="0x04542000" />
+        <register type="NOA" address="0x00009888" value="0x0E559000" />
+        <register type="NOA" address="0x00009888" value="0x00559800" />
+        <register type="NOA" address="0x00009888" value="0x10550000" />
+        <register type="NOA" address="0x00009888" value="0x1B8AA000" />
+        <register type="NOA" address="0x00009888" value="0x1D8A0002" />
+        <register type="NOA" address="0x00009888" value="0x038A8000" />
+        <register type="NOA" address="0x00009888" value="0x058A8000" />
+        <register type="NOA" address="0x00009888" value="0x078A8000" />
+        <register type="NOA" address="0x00009888" value="0x098A8000" />
+        <register type="NOA" address="0x00009888" value="0x0B8A8000" />
+        <register type="NOA" address="0x00009888" value="0x0D8A8000" />
+        <register type="NOA" address="0x00009888" value="0x278B0015" />
+        <register type="NOA" address="0x00009888" value="0x238B2A80" />
+        <register type="NOA" address="0x00009888" value="0x258B0005" />
+        <register type="NOA" address="0x00009888" value="0x2385002A" />
+        <register type="NOA" address="0x00009888" value="0x1F85AA00" />
+        <register type="NOA" address="0x00009888" value="0x2185000A" />
+        <register type="NOA" address="0x00009888" value="0x1B830150" />
+        <register type="NOA" address="0x00009888" value="0x03834000" />
+        <register type="NOA" address="0x00009888" value="0x05834000" />
+        <register type="NOA" address="0x00009888" value="0x07834000" />
+        <register type="NOA" address="0x00009888" value="0x09834000" />
+        <register type="NOA" address="0x00009888" value="0x0B834000" />
+        <register type="NOA" address="0x00009888" value="0x0D834000" />
+        <register type="NOA" address="0x00009888" value="0x0D848000" />
+        <register type="NOA" address="0x00009888" value="0x0F84C000" />
+        <register type="NOA" address="0x00009888" value="0x01848000" />
+        <register type="NOA" address="0x00009888" value="0x0384C000" />
+        <register type="NOA" address="0x00009888" value="0x0584C000" />
+        <register type="NOA" address="0x00009888" value="0x07844000" />
+        <register type="NOA" address="0x00009888" value="0x1D808000" />
+        <register type="NOA" address="0x00009888" value="0x1F80C000" />
+        <register type="NOA" address="0x00009888" value="0x11808000" />
+        <register type="NOA" address="0x00009888" value="0x1380C000" />
+        <register type="NOA" address="0x00009888" value="0x1580C000" />
+        <register type="NOA" address="0x00009888" value="0x17804000" />
+        <register type="NOA" address="0x00009888" value="0x53800000" />
+        <register type="NOA" address="0x00009888" value="0x47801021" />
+        <register type="NOA" address="0x00009888" value="0x21800000" />
+        <register type="NOA" address="0x00009888" value="0x31800000" />
+        <register type="NOA" address="0x00009888" value="0x4D800000" />
+        <register type="NOA" address="0x00009888" value="0x3F800C64" />
+        <register type="NOA" address="0x00009888" value="0x4F800000" />
+        <register type="NOA" address="0x00009888" value="0x41800C02" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x000091BC" value="0xE0500000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002744" value="0x00800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x70800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+        <register type="OA" address="0x00002770" value="0x0000C000" />
+        <register type="OA" address="0x00002774" value="0x0000E7FF" />
+        <register type="OA" address="0x00002778" value="0x00003000" />
+        <register type="OA" address="0x0000277C" value="0x0000F9FF" />
+        <register type="OA" address="0x00002780" value="0x00000C00" />
+        <register type="OA" address="0x00002784" value="0x0000FE7F" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E758" value="0x00015014" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+        <register type="FLEX" address="0x0000E65C" value="0x00055054" />
+    </register_config>
+  </set>
+
+  <set name="Metric set TDL_1"
+       mdapi_supported_apis="VK OGL OCL IO BB"
+       underscore_name="tdl_1"
+       hw_config_guid="eb97e523-d9ac-48a9-b7f8-9cc909ddbf14"
+       chipset="CHV"
+       symbol_name="TDL_1"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SQ is full"
+             description="The percentage of time when SQ is filled above a threshold (usually 48 entries)"
+             data_type="float"
+             max_equation="100"
+             equation="PERFCNT1 READ_REG 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gt_request_queue_full"
+             units="percent"
+             symbol_name="GTRequestQueueFull"
+             availability="true $QueryMode &&"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL4 OCL"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on the both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="PS Thread Ready For Dispatch on Slice1 Subslice1"
+             description="The percentage of time in which PS thread is ready for dispatch on slice1 subslice1 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="B 5 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_thread11_ready_for_dispatch"
+             units="percent"
+             symbol_name="PSThread11ReadyForDispatch"
+             availability="$SubsliceMask 0x10 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="NonPS Thread Ready For Dispatch on Slice1 Subslice2"
+             description="The percentage of time in which non-PS thread is ready for dispatch on slice1 subslice2 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="B 4 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="non_ps_thread12_ready_for_dispatch"
+             units="percent"
+             symbol_name="NonPSThread12ReadyForDispatch"
+             availability="$SubsliceMask 0x20 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="NonPS Thread Ready For Dispatch on Slice1 Subslice0"
+             description="The percentage of time in which non-PS thread is ready for dispatch on slice1 subslice0 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="B 2 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="non_ps_thread10_ready_for_dispatch"
+             units="percent"
+             symbol_name="NonPSThread10ReadyForDispatch"
+             availability="$SubsliceMask 0x8 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Thread Header Ready on Slice0 Subslice1 Port 0"
+             description="The percentage of time in which thread header is ready on slice0 subslice1 thread dispatcher port 0"
+             data_type="float"
+             max_equation="100"
+             equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header01_ready_port0"
+             units="percent"
+             symbol_name="ThreadHeader01ReadyPort0"
+             availability="$SubsliceMask 0x2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Thread Header Ready on Slice0 Subslice1 Port 1"
+             description="The percentage of time in which thread header is ready on slice0 subslice1 thread dispatcher port 1"
+             data_type="float"
+             max_equation="100"
+             equation="C 2 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header01_ready_port1"
+             units="percent"
+             symbol_name="ThreadHeader01ReadyPort1"
+             availability="$SubsliceMask 0x2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Thread Header Ready on Slice0 Subslice2 Port 1"
+             description="The percentage of time in which thread header is ready on slice0 subslice2 thread dispatcher port 1"
+             data_type="float"
+             max_equation="100"
+             equation="C 4 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header02_ready_port1"
+             units="percent"
+             symbol_name="ThreadHeader02ReadyPort1"
+             availability="$SubsliceMask 0x4 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Thread Header Ready on Slice0 Subslice2 Port 0"
+             description="The percentage of time in which thread header is ready on slice0 subslice2 thread dispatcher port 0"
+             data_type="float"
+             max_equation="100"
+             equation="C 3 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header02_ready_port0"
+             units="percent"
+             symbol_name="ThreadHeader02ReadyPort0"
+             availability="$SubsliceMask 0x4 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="PS Thread Ready For Dispatch on Slice1 Subslice2"
+             description="The percentage of time in which PS thread is ready for dispatch on slice1 subslice2 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="B 3 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_thread12_ready_for_dispatch"
+             units="percent"
+             symbol_name="PSThread12ReadyForDispatch"
+             availability="$SubsliceMask 0x20 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="PS Thread Ready For Dispatch on Slice1 Subslice0"
+             description="The percentage of time in which PS thread is ready for dispatch on slice1 subslice0 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="B 1 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_thread10_ready_for_dispatch"
+             units="percent"
+             symbol_name="PSThread10ReadyForDispatch"
+             availability="$SubsliceMask 0x8 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="NonPS Thread Ready For Dispatch on Slice1 Subslice1"
+             description="The percentage of time in which non-PS thread is ready for dispatch on slice1 subslice1 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="non_ps_thread11_ready_for_dispatch"
+             units="percent"
+             symbol_name="NonPSThread11ReadyForDispatch"
+             availability="$SubsliceMask 0x10 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL 2 UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="Thread Header Ready on Slice0 Subslice0 Port 0"
+             description="The percentage of time in which thread header is ready on slice0 subslice0 thread dispatcher port 0"
+             data_type="float"
+             max_equation="100"
+             equation="C 5 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header00_ready_port0"
+             units="percent"
+             symbol_name="ThreadHeader00ReadyPort0"
+             availability="$SubsliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <counter name="Thread Header Ready on Slice0 Subslice0 Port 1"
+             description="The percentage of time in which thread header is ready on slice0 subslice0 thread dispatcher port 1"
+             data_type="float"
+             max_equation="100"
+             equation="C 6 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header00_ready_port1"
+             units="percent"
+             symbol_name="ThreadHeader00ReadyPort1"
+             availability="$SubsliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x000000A0" />
+        <register type="NOA" address="0x00009888" value="0x16154D60" />
+        <register type="NOA" address="0x00009888" value="0x16352E60" />
+        <register type="NOA" address="0x00009888" value="0x16554D60" />
+        <register type="NOA" address="0x00009888" value="0x16950000" />
+        <register type="NOA" address="0x00009888" value="0x16B50000" />
+        <register type="NOA" address="0x00009888" value="0x16D50000" />
+        <register type="NOA" address="0x00009888" value="0x005C8000" />
+        <register type="NOA" address="0x00009888" value="0x045CC000" />
+        <register type="NOA" address="0x00009888" value="0x065C4000" />
+        <register type="NOA" address="0x00009888" value="0x083D8000" />
+        <register type="NOA" address="0x00009888" value="0x0A3D8000" />
+        <register type="NOA" address="0x00009888" value="0x0458C000" />
+        <register type="NOA" address="0x00009888" value="0x025B8000" />
+        <register type="NOA" address="0x00009888" value="0x085B4000" />
+        <register type="NOA" address="0x00009888" value="0x0A5B4000" />
+        <register type="NOA" address="0x00009888" value="0x0C5B8000" />
+        <register type="NOA" address="0x00009888" value="0x0C1FA000" />
+        <register type="NOA" address="0x00009888" value="0x0E1F00AA" />
+        <register type="NOA" address="0x00009888" value="0x02384000" />
+        <register type="NOA" address="0x00009888" value="0x04388000" />
+        <register type="NOA" address="0x00009888" value="0x06388000" />
+        <register type="NOA" address="0x00009888" value="0x08384000" />
+        <register type="NOA" address="0x00009888" value="0x0A384000" />
+        <register type="NOA" address="0x00009888" value="0x0C384000" />
+        <register type="NOA" address="0x00009888" value="0x00398000" />
+        <register type="NOA" address="0x00009888" value="0x0239A000" />
+        <register type="NOA" address="0x00009888" value="0x0439A000" />
+        <register type="NOA" address="0x00009888" value="0x06392000" />
+        <register type="NOA" address="0x00009888" value="0x043A8000" />
+        <register type="NOA" address="0x00009888" value="0x063A8000" />
+        <register type="NOA" address="0x00009888" value="0x08138000" />
+        <register type="NOA" address="0x00009888" value="0x0A138000" />
+        <register type="NOA" address="0x00009888" value="0x06143000" />
+        <register type="NOA" address="0x00009888" value="0x0415CFC7" />
+        <register type="NOA" address="0x00009888" value="0x10150000" />
+        <register type="NOA" address="0x00009888" value="0x02338000" />
+        <register type="NOA" address="0x00009888" value="0x0C338000" />
+        <register type="NOA" address="0x00009888" value="0x04342000" />
+        <register type="NOA" address="0x00009888" value="0x06344000" />
+        <register type="NOA" address="0x00009888" value="0x0035C700" />
+        <register type="NOA" address="0x00009888" value="0x063500CF" />
+        <register type="NOA" address="0x00009888" value="0x10350000" />
+        <register type="NOA" address="0x00009888" value="0x04538000" />
+        <register type="NOA" address="0x00009888" value="0x06538000" />
+        <register type="NOA" address="0x00009888" value="0x0454C000" />
+        <register type="NOA" address="0x00009888" value="0x0255CFC7" />
+        <register type="NOA" address="0x00009888" value="0x10550000" />
+        <register type="NOA" address="0x00009888" value="0x06DC8000" />
+        <register type="NOA" address="0x00009888" value="0x08DC4000" />
+        <register type="NOA" address="0x00009888" value="0x0CDCC000" />
+        <register type="NOA" address="0x00009888" value="0x0EDCC000" />
+        <register type="NOA" address="0x00009888" value="0x1ABD00A8" />
+        <register type="NOA" address="0x00009888" value="0x0CD8C000" />
+        <register type="NOA" address="0x00009888" value="0x0ED84000" />
+        <register type="NOA" address="0x00009888" value="0x0EDB8000" />
+        <register type="NOA" address="0x00009888" value="0x18DB0800" />
+        <register type="NOA" address="0x00009888" value="0x1ADB0254" />
+        <register type="NOA" address="0x00009888" value="0x0E9FAA00" />
+        <register type="NOA" address="0x00009888" value="0x109F02AA" />
+        <register type="NOA" address="0x00009888" value="0x0EB84000" />
+        <register type="NOA" address="0x00009888" value="0x16B84000" />
+        <register type="NOA" address="0x00009888" value="0x18B8156A" />
+        <register type="NOA" address="0x00009888" value="0x06B98000" />
+        <register type="NOA" address="0x00009888" value="0x08B9A000" />
+        <register type="NOA" address="0x00009888" value="0x0AB9A000" />
+        <register type="NOA" address="0x00009888" value="0x0CB9A000" />
+        <register type="NOA" address="0x00009888" value="0x0EB9A000" />
+        <register type="NOA" address="0x00009888" value="0x18BAA000" />
+        <register type="NOA" address="0x00009888" value="0x1ABA0002" />
+        <register type="NOA" address="0x00009888" value="0x16934000" />
+        <register type="NOA" address="0x00009888" value="0x1893000A" />
+        <register type="NOA" address="0x00009888" value="0x0A947000" />
+        <register type="NOA" address="0x00009888" value="0x0C95C5C1" />
+        <register type="NOA" address="0x00009888" value="0x0E9500C3" />
+        <register type="NOA" address="0x00009888" value="0x10950000" />
+        <register type="NOA" address="0x00009888" value="0x0EB38000" />
+        <register type="NOA" address="0x00009888" value="0x16B30040" />
+        <register type="NOA" address="0x00009888" value="0x18B30020" />
+        <register type="NOA" address="0x00009888" value="0x06B48000" />
+        <register type="NOA" address="0x00009888" value="0x08B41000" />
+        <register type="NOA" address="0x00009888" value="0x0AB48000" />
+        <register type="NOA" address="0x00009888" value="0x06B5C500" />
+        <register type="NOA" address="0x00009888" value="0x08B500C3" />
+        <register type="NOA" address="0x00009888" value="0x0EB5C100" />
+        <register type="NOA" address="0x00009888" value="0x10B50000" />
+        <register type="NOA" address="0x00009888" value="0x16D31500" />
+        <register type="NOA" address="0x00009888" value="0x08D4E000" />
+        <register type="NOA" address="0x00009888" value="0x08D5C100" />
+        <register type="NOA" address="0x00009888" value="0x0AD5C3C5" />
+        <register type="NOA" address="0x00009888" value="0x10D50000" />
+        <register type="NOA" address="0x00009888" value="0x0D88F800" />
+        <register type="NOA" address="0x00009888" value="0x0F88000F" />
+        <register type="NOA" address="0x00009888" value="0x038A8000" />
+        <register type="NOA" address="0x00009888" value="0x058A8000" />
+        <register type="NOA" address="0x00009888" value="0x078A8000" />
+        <register type="NOA" address="0x00009888" value="0x098A8000" />
+        <register type="NOA" address="0x00009888" value="0x0B8A8000" />
+        <register type="NOA" address="0x00009888" value="0x0D8A8000" />
+        <register type="NOA" address="0x00009888" value="0x258BAAA5" />
+        <register type="NOA" address="0x00009888" value="0x278B002A" />
+        <register type="NOA" address="0x00009888" value="0x238B2A80" />
+        <register type="NOA" address="0x00009888" value="0x0F8C4000" />
+        <register type="NOA" address="0x00009888" value="0x178C2000" />
+        <register type="NOA" address="0x00009888" value="0x198C5500" />
+        <register type="NOA" address="0x00009888" value="0x1B8C0015" />
+        <register type="NOA" address="0x00009888" value="0x078D8000" />
+        <register type="NOA" address="0x00009888" value="0x098DA000" />
+        <register type="NOA" address="0x00009888" value="0x0B8DA000" />
+        <register type="NOA" address="0x00009888" value="0x0D8DA000" />
+        <register type="NOA" address="0x00009888" value="0x0F8DA000" />
+        <register type="NOA" address="0x00009888" value="0x2185AAAA" />
+        <register type="NOA" address="0x00009888" value="0x2385002A" />
+        <register type="NOA" address="0x00009888" value="0x1F85AA00" />
+        <register type="NOA" address="0x00009888" value="0x0F834000" />
+        <register type="NOA" address="0x00009888" value="0x19835400" />
+        <register type="NOA" address="0x00009888" value="0x1B830155" />
+        <register type="NOA" address="0x00009888" value="0x03834000" />
+        <register type="NOA" address="0x00009888" value="0x05834000" />
+        <register type="NOA" address="0x00009888" value="0x07834000" />
+        <register type="NOA" address="0x00009888" value="0x09834000" />
+        <register type="NOA" address="0x00009888" value="0x0B834000" />
+        <register type="NOA" address="0x00009888" value="0x0D834000" />
+        <register type="NOA" address="0x00009888" value="0x0784C000" />
+        <register type="NOA" address="0x00009888" value="0x0984C000" />
+        <register type="NOA" address="0x00009888" value="0x0B84C000" />
+        <register type="NOA" address="0x00009888" value="0x0D84C000" />
+        <register type="NOA" address="0x00009888" value="0x0F84C000" />
+        <register type="NOA" address="0x00009888" value="0x01848000" />
+        <register type="NOA" address="0x00009888" value="0x0384C000" />
+        <register type="NOA" address="0x00009888" value="0x0584C000" />
+        <register type="NOA" address="0x00009888" value="0x1780C000" />
+        <register type="NOA" address="0x00009888" value="0x1980C000" />
+        <register type="NOA" address="0x00009888" value="0x1B80C000" />
+        <register type="NOA" address="0x00009888" value="0x1D80C000" />
+        <register type="NOA" address="0x00009888" value="0x1F80C000" />
+        <register type="NOA" address="0x00009888" value="0x11808000" />
+        <register type="NOA" address="0x00009888" value="0x1380C000" />
+        <register type="NOA" address="0x00009888" value="0x1580C000" />
+        <register type="NOA" address="0x00009888" value="0x4F800000" />
+        <register type="NOA" address="0x00009888" value="0x43800C42" />
+        <register type="NOA" address="0x00009888" value="0x51800000" />
+        <register type="NOA" address="0x00009888" value="0x45800063" />
+        <register type="NOA" address="0x00009888" value="0x53800000" />
+        <register type="NOA" address="0x00009888" value="0x47800800" />
+        <register type="NOA" address="0x00009888" value="0x21800000" />
+        <register type="NOA" address="0x00009888" value="0x31800000" />
+        <register type="NOA" address="0x00009888" value="0x4D800000" />
+        <register type="NOA" address="0x00009888" value="0x3F8014A4" />
+        <register type="NOA" address="0x00009888" value="0x41801042" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x000091BC" value="0xE0500000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002744" value="0x00800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x30800000" />
+        <register type="OA" address="0x00002770" value="0x00000002" />
+        <register type="OA" address="0x00002774" value="0x0000FDFF" />
+        <register type="OA" address="0x00002778" value="0x00000000" />
+        <register type="OA" address="0x0000277C" value="0x0000FE7F" />
+        <register type="OA" address="0x00002780" value="0x00000002" />
+        <register type="OA" address="0x00002784" value="0x0000FFBF" />
+        <register type="OA" address="0x00002788" value="0x00000000" />
+        <register type="OA" address="0x0000278C" value="0x0000FFCF" />
+        <register type="OA" address="0x00002790" value="0x00000002" />
+        <register type="OA" address="0x00002794" value="0x0000FFF7" />
+        <register type="OA" address="0x00002798" value="0x00000000" />
+        <register type="OA" address="0x0000279C" value="0x0000FFF9" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E758" value="0x00015014" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+        <register type="FLEX" address="0x0000E65C" value="0x00055054" />
+    </register_config>
+  </set>
+
+  <set name="Metric set TDL_2"
+       mdapi_supported_apis="VK OGL OCL IO BB"
+       underscore_name="tdl_2"
+       hw_config_guid="dff6158e-8409-452c-be76-91c9946330bd"
+       chipset="CHV"
+       symbol_name="TDL_2"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Thread Header Ready on Slice1 Subslice1 Port 1"
+             description="The percentage of time in which thread header is ready on slice1 subslice1 thread dispatcher port 1"
+             data_type="float"
+             max_equation="100"
+             equation="C 5 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header11_ready_port1"
+             units="percent"
+             symbol_name="ThreadHeader11ReadyPort1"
+             availability="$SubsliceMask 0x10 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on the both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="NonPS Thread Ready For Dispatch on Slice0 Subslice2"
+             description="The percentage of time in which non-PS thread is ready for dispatch on slice0 subslice2 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="non_ps_thread02_ready_for_dispatch"
+             units="percent"
+             symbol_name="NonPSThread02ReadyForDispatch"
+             availability="$SubsliceMask 0x4 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="NonPS Thread Ready For Dispatch on Slice0 Subslice0"
+             description="The percentage of time in which non-PS thread is ready for dispatch on slice0 subslice0 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="B 5 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="non_ps_thread00_ready_for_dispatch"
+             units="percent"
+             symbol_name="NonPSThread00ReadyForDispatch"
+             availability="$SubsliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SQ is full"
+             description="The percentage of time when SQ is filled above a threshold (usually 48 entries)"
+             data_type="float"
+             max_equation="100"
+             equation="PERFCNT1 READ_REG 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gt_request_queue_full"
+             units="percent"
+             symbol_name="GTRequestQueueFull"
+             availability="true $QueryMode &&"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL4 OCL"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Thread Header Ready on Slice1 Subslice1 Port 0"
+             description="The percentage of time in which thread header is ready on slice1 subslice1 thread dispatcher port 0"
+             data_type="float"
+             max_equation="100"
+             equation="C 2 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header11_ready_port0"
+             units="percent"
+             symbol_name="ThreadHeader11ReadyPort0"
+             availability="$SubsliceMask 0x10 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Thread Header Ready on Slice1 Subslice2 Port 0"
+             description="The percentage of time in which thread header is ready on slice1 subslice2 thread dispatcher port 0"
+             data_type="float"
+             max_equation="100"
+             equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header12_ready_port0"
+             units="percent"
+             symbol_name="ThreadHeader12ReadyPort0"
+             availability="$SubsliceMask 0x20 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="PS Thread Ready For Dispatch on Slice0 Subslice0"
+             description="The percentage of time in which PS thread is ready for dispatch on slice0 subslice0 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="B 3 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_thread00_ready_for_dispatch"
+             units="percent"
+             symbol_name="PSThread00ReadyForDispatch"
+             availability="$SubsliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Thread Header Ready on Slice1 Subslice0 Port 1"
+             description="The percentage of time in which thread header is ready on slice1 subslice0 thread dispatcher port 1"
+             data_type="float"
+             max_equation="100"
+             equation="C 3 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header10_ready_port1"
+             units="percent"
+             symbol_name="ThreadHeader10ReadyPort1"
+             availability="$SubsliceMask 0x8 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="PS Thread Ready For Dispatch on Slice0 Subslice1"
+             description="The percentage of time in which PS thread is ready for dispatch on slice0 subslice1 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="B 2 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_thread01_ready_for_dispatch"
+             units="percent"
+             symbol_name="PSThread01ReadyForDispatch"
+             availability="$SubsliceMask 0x2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Thread Header Ready on Slice1 Subslice2 Port 1"
+             description="The percentage of time in which thread header is ready on slice1 subslice2 thread dispatcher port 1"
+             data_type="float"
+             max_equation="100"
+             equation="C 6 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header12_ready_port1"
+             units="percent"
+             symbol_name="ThreadHeader12ReadyPort1"
+             availability="$SubsliceMask 0x20 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="PS Thread Ready For Dispatch on Slice0 Subslice2"
+             description="The percentage of time in which PS thread is ready for dispatch on slice0 subslice2 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="B 1 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_thread02_ready_for_dispatch"
+             units="percent"
+             symbol_name="PSThread02ReadyForDispatch"
+             availability="$SubsliceMask 0x4 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL 2 UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="Thread Header Ready on Slice1 Subslice0 Port 0"
+             description="The percentage of time in which thread header is ready on slice1 subslice0 thread dispatcher port 0"
+             data_type="float"
+             max_equation="100"
+             equation="C 4 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header10_ready_port0"
+             units="percent"
+             symbol_name="ThreadHeader10ReadyPort0"
+             availability="$SubsliceMask 0x8 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <counter name="NonPS Thread Ready For Dispatch on Slice0 Subslice1"
+             description="The percentage of time in which non-PS thread is ready for dispatch on slice0 subslice1 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="B 4 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="non_ps_thread01_ready_for_dispatch"
+             units="percent"
+             symbol_name="NonPSThread01ReadyForDispatch"
+             availability="$SubsliceMask 0x2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x000000A0" />
+        <register type="NOA" address="0x00009888" value="0x16150000" />
+        <register type="NOA" address="0x00009888" value="0x16350000" />
+        <register type="NOA" address="0x00009888" value="0x16550000" />
+        <register type="NOA" address="0x00009888" value="0x16952E60" />
+        <register type="NOA" address="0x00009888" value="0x16B54D60" />
+        <register type="NOA" address="0x00009888" value="0x16D52E60" />
+        <register type="NOA" address="0x00009888" value="0x065C8000" />
+        <register type="NOA" address="0x00009888" value="0x085CC000" />
+        <register type="NOA" address="0x00009888" value="0x0A5CC000" />
+        <register type="NOA" address="0x00009888" value="0x0C5C4000" />
+        <register type="NOA" address="0x00009888" value="0x0E3D8000" />
+        <register type="NOA" address="0x00009888" value="0x183DA000" />
+        <register type="NOA" address="0x00009888" value="0x06588000" />
+        <register type="NOA" address="0x00009888" value="0x08588000" />
+        <register type="NOA" address="0x00009888" value="0x0A584000" />
+        <register type="NOA" address="0x00009888" value="0x0E5B4000" />
+        <register type="NOA" address="0x00009888" value="0x185B5800" />
+        <register type="NOA" address="0x00009888" value="0x1A5B000A" />
+        <register type="NOA" address="0x00009888" value="0x0E1FAA00" />
+        <register type="NOA" address="0x00009888" value="0x101F02AA" />
+        <register type="NOA" address="0x00009888" value="0x0E384000" />
+        <register type="NOA" address="0x00009888" value="0x16384000" />
+        <register type="NOA" address="0x00009888" value="0x18382A55" />
+        <register type="NOA" address="0x00009888" value="0x06398000" />
+        <register type="NOA" address="0x00009888" value="0x0839A000" />
+        <register type="NOA" address="0x00009888" value="0x0A39A000" />
+        <register type="NOA" address="0x00009888" value="0x0C39A000" />
+        <register type="NOA" address="0x00009888" value="0x0E39A000" />
+        <register type="NOA" address="0x00009888" value="0x1A3A02A0" />
+        <register type="NOA" address="0x00009888" value="0x0E138000" />
+        <register type="NOA" address="0x00009888" value="0x16130500" />
+        <register type="NOA" address="0x00009888" value="0x06148000" />
+        <register type="NOA" address="0x00009888" value="0x08146000" />
+        <register type="NOA" address="0x00009888" value="0x0615C100" />
+        <register type="NOA" address="0x00009888" value="0x0815C500" />
+        <register type="NOA" address="0x00009888" value="0x0A1500C3" />
+        <register type="NOA" address="0x00009888" value="0x10150000" />
+        <register type="NOA" address="0x00009888" value="0x16335040" />
+        <register type="NOA" address="0x00009888" value="0x08349000" />
+        <register type="NOA" address="0x00009888" value="0x0A341000" />
+        <register type="NOA" address="0x00009888" value="0x083500C1" />
+        <register type="NOA" address="0x00009888" value="0x0A35C500" />
+        <register type="NOA" address="0x00009888" value="0x0C3500C3" />
+        <register type="NOA" address="0x00009888" value="0x10350000" />
+        <register type="NOA" address="0x00009888" value="0x1853002A" />
+        <register type="NOA" address="0x00009888" value="0x0A54E000" />
+        <register type="NOA" address="0x00009888" value="0x0C55C500" />
+        <register type="NOA" address="0x00009888" value="0x0E55C1C3" />
+        <register type="NOA" address="0x00009888" value="0x10550000" />
+        <register type="NOA" address="0x00009888" value="0x00DC8000" />
+        <register type="NOA" address="0x00009888" value="0x02DCC000" />
+        <register type="NOA" address="0x00009888" value="0x04DC4000" />
+        <register type="NOA" address="0x00009888" value="0x04BD8000" />
+        <register type="NOA" address="0x00009888" value="0x06BD8000" />
+        <register type="NOA" address="0x00009888" value="0x02D8C000" />
+        <register type="NOA" address="0x00009888" value="0x02DB8000" />
+        <register type="NOA" address="0x00009888" value="0x04DB4000" />
+        <register type="NOA" address="0x00009888" value="0x06DB4000" />
+        <register type="NOA" address="0x00009888" value="0x08DB8000" />
+        <register type="NOA" address="0x00009888" value="0x0C9FA000" />
+        <register type="NOA" address="0x00009888" value="0x0E9F00AA" />
+        <register type="NOA" address="0x00009888" value="0x02B84000" />
+        <register type="NOA" address="0x00009888" value="0x04B84000" />
+        <register type="NOA" address="0x00009888" value="0x06B84000" />
+        <register type="NOA" address="0x00009888" value="0x08B84000" />
+        <register type="NOA" address="0x00009888" value="0x0AB88000" />
+        <register type="NOA" address="0x00009888" value="0x0CB88000" />
+        <register type="NOA" address="0x00009888" value="0x00B98000" />
+        <register type="NOA" address="0x00009888" value="0x02B9A000" />
+        <register type="NOA" address="0x00009888" value="0x04B9A000" />
+        <register type="NOA" address="0x00009888" value="0x06B92000" />
+        <register type="NOA" address="0x00009888" value="0x0ABA8000" />
+        <register type="NOA" address="0x00009888" value="0x0CBA8000" />
+        <register type="NOA" address="0x00009888" value="0x04938000" />
+        <register type="NOA" address="0x00009888" value="0x06938000" />
+        <register type="NOA" address="0x00009888" value="0x0494C000" />
+        <register type="NOA" address="0x00009888" value="0x0295CFC7" />
+        <register type="NOA" address="0x00009888" value="0x10950000" />
+        <register type="NOA" address="0x00009888" value="0x02B38000" />
+        <register type="NOA" address="0x00009888" value="0x08B38000" />
+        <register type="NOA" address="0x00009888" value="0x04B42000" />
+        <register type="NOA" address="0x00009888" value="0x06B41000" />
+        <register type="NOA" address="0x00009888" value="0x00B5C700" />
+        <register type="NOA" address="0x00009888" value="0x04B500CF" />
+        <register type="NOA" address="0x00009888" value="0x10B50000" />
+        <register type="NOA" address="0x00009888" value="0x0AD38000" />
+        <register type="NOA" address="0x00009888" value="0x0CD38000" />
+        <register type="NOA" address="0x00009888" value="0x06D46000" />
+        <register type="NOA" address="0x00009888" value="0x04D5C700" />
+        <register type="NOA" address="0x00009888" value="0x06D500CF" />
+        <register type="NOA" address="0x00009888" value="0x10D50000" />
+        <register type="NOA" address="0x00009888" value="0x03888000" />
+        <register type="NOA" address="0x00009888" value="0x05888000" />
+        <register type="NOA" address="0x00009888" value="0x07888000" />
+        <register type="NOA" address="0x00009888" value="0x09888000" />
+        <register type="NOA" address="0x00009888" value="0x0B888000" />
+        <register type="NOA" address="0x00009888" value="0x0D880400" />
+        <register type="NOA" address="0x00009888" value="0x0F8A8000" />
+        <register type="NOA" address="0x00009888" value="0x198A8000" />
+        <register type="NOA" address="0x00009888" value="0x1B8AAAA0" />
+        <register type="NOA" address="0x00009888" value="0x1D8A0002" />
+        <register type="NOA" address="0x00009888" value="0x258B555A" />
+        <register type="NOA" address="0x00009888" value="0x278B0015" />
+        <register type="NOA" address="0x00009888" value="0x238B5500" />
+        <register type="NOA" address="0x00009888" value="0x038C4000" />
+        <register type="NOA" address="0x00009888" value="0x058C4000" />
+        <register type="NOA" address="0x00009888" value="0x078C4000" />
+        <register type="NOA" address="0x00009888" value="0x098C4000" />
+        <register type="NOA" address="0x00009888" value="0x0B8C4000" />
+        <register type="NOA" address="0x00009888" value="0x0D8C4000" />
+        <register type="NOA" address="0x00009888" value="0x018D8000" />
+        <register type="NOA" address="0x00009888" value="0x038DA000" />
+        <register type="NOA" address="0x00009888" value="0x058DA000" />
+        <register type="NOA" address="0x00009888" value="0x078D2000" />
+        <register type="NOA" address="0x00009888" value="0x2185AAAA" />
+        <register type="NOA" address="0x00009888" value="0x2385002A" />
+        <register type="NOA" address="0x00009888" value="0x1F85AA00" />
+        <register type="NOA" address="0x00009888" value="0x0F834000" />
+        <register type="NOA" address="0x00009888" value="0x19835400" />
+        <register type="NOA" address="0x00009888" value="0x1B830155" />
+        <register type="NOA" address="0x00009888" value="0x03834000" />
+        <register type="NOA" address="0x00009888" value="0x05834000" />
+        <register type="NOA" address="0x00009888" value="0x07834000" />
+        <register type="NOA" address="0x00009888" value="0x09834000" />
+        <register type="NOA" address="0x00009888" value="0x0B834000" />
+        <register type="NOA" address="0x00009888" value="0x0D834000" />
+        <register type="NOA" address="0x00009888" value="0x0784C000" />
+        <register type="NOA" address="0x00009888" value="0x0984C000" />
+        <register type="NOA" address="0x00009888" value="0x0B84C000" />
+        <register type="NOA" address="0x00009888" value="0x0D84C000" />
+        <register type="NOA" address="0x00009888" value="0x0F84C000" />
+        <register type="NOA" address="0x00009888" value="0x01848000" />
+        <register type="NOA" address="0x00009888" value="0x0384C000" />
+        <register type="NOA" address="0x00009888" value="0x0584C000" />
+        <register type="NOA" address="0x00009888" value="0x1780C000" />
+        <register type="NOA" address="0x00009888" value="0x1980C000" />
+        <register type="NOA" address="0x00009888" value="0x1B80C000" />
+        <register type="NOA" address="0x00009888" value="0x1D80C000" />
+        <register type="NOA" address="0x00009888" value="0x1F80C000" />
+        <register type="NOA" address="0x00009888" value="0x11808000" />
+        <register type="NOA" address="0x00009888" value="0x1380C000" />
+        <register type="NOA" address="0x00009888" value="0x1580C000" />
+        <register type="NOA" address="0x00009888" value="0x4F800000" />
+        <register type="NOA" address="0x00009888" value="0x43800882" />
+        <register type="NOA" address="0x00009888" value="0x51800000" />
+        <register type="NOA" address="0x00009888" value="0x45801082" />
+        <register type="NOA" address="0x00009888" value="0x53800000" />
+        <register type="NOA" address="0x00009888" value="0x478014A5" />
+        <register type="NOA" address="0x00009888" value="0x21800000" />
+        <register type="NOA" address="0x00009888" value="0x31800000" />
+        <register type="NOA" address="0x00009888" value="0x4D800000" />
+        <register type="NOA" address="0x00009888" value="0x3F800002" />
+        <register type="NOA" address="0x00009888" value="0x41800C62" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x000091BC" value="0xE0500000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002744" value="0x00800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x30800000" />
+        <register type="OA" address="0x00002770" value="0x00000002" />
+        <register type="OA" address="0x00002774" value="0x0000FDFF" />
+        <register type="OA" address="0x00002778" value="0x00000000" />
+        <register type="OA" address="0x0000277C" value="0x0000FE7F" />
+        <register type="OA" address="0x00002780" value="0x00000000" />
+        <register type="OA" address="0x00002784" value="0x0000FF9F" />
+        <register type="OA" address="0x00002788" value="0x00000000" />
+        <register type="OA" address="0x0000278C" value="0x0000FFE7" />
+        <register type="OA" address="0x00002790" value="0x00000002" />
+        <register type="OA" address="0x00002794" value="0x0000FFFB" />
+        <register type="OA" address="0x00002798" value="0x00000002" />
+        <register type="OA" address="0x0000279C" value="0x0000FFFD" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E758" value="0x00015014" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+        <register type="FLEX" address="0x0000E65C" value="0x00055054" />
+    </register_config>
+  </set>
+
+  <set name="MDAPI testing set Gen8LP"
+       mdapi_supported_apis="VK OGL OCL IO BB"
+       underscore_name="test_oa"
+       hw_config_guid="4a534b07-cba3-414d-8d60-874830e883aa"
+       chipset="CHV"
+       symbol_name="TestOa"
+       >
+    <counter name="TestCounter7"
+             description="HW test counter 7. Factor: 0.666"
+             data_type="uint64"
+             equation="B 7 READ"
+             underscore_name="counter7"
+             units="events"
+             symbol_name="Counter7"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="TestCounter8"
+             description="HW test counter 8. Should be equal to 1."
+             data_type="uint64"
+             equation="C 7 READ"
+             underscore_name="counter8"
+             units="events"
+             symbol_name="Counter8"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="TestCounter4"
+             description="HW test counter 4. Factor: 0.333"
+             data_type="uint64"
+             equation="B 4 READ"
+             underscore_name="counter4"
+             units="events"
+             symbol_name="Counter4"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="TestCounter5"
+             description="HW test counter 5. Factor: 0.333"
+             data_type="uint64"
+             equation="B 5 READ"
+             underscore_name="counter5"
+             units="events"
+             symbol_name="Counter5"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="TestCounter6"
+             description="HW test counter 6. Factor: 0.166"
+             data_type="uint64"
+             equation="B 6 READ"
+             underscore_name="counter6"
+             units="events"
+             symbol_name="Counter6"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="TestCounter3"
+             description="HW test counter 3. Factor: 0.5"
+             data_type="uint64"
+             equation="B 3 READ"
+             underscore_name="counter3"
+             units="events"
+             symbol_name="Counter3"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="TestCounter0"
+             description="HW test counter 0. Factor: 0.0"
+             data_type="uint64"
+             equation="B 0 READ"
+             underscore_name="counter0"
+             units="events"
+             symbol_name="Counter0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="TestCounter1"
+             description="HW test counter 1. Factor: 1.0"
+             data_type="uint64"
+             equation="B 1 READ"
+             underscore_name="counter1"
+             units="events"
+             symbol_name="Counter1"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="TestCounter2"
+             description="HW test counter 2. Factor: 1.0"
+             data_type="uint64"
+             equation="B 2 READ"
+             underscore_name="counter2"
+             units="events"
+             symbol_name="Counter2"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x000000A0" />
+        <register type="NOA" address="0x00009888" value="0x59800000" />
+        <register type="NOA" address="0x00009888" value="0x59800001" />
+        <register type="NOA" address="0x00009888" value="0x338B0000" />
+        <register type="NOA" address="0x00009888" value="0x258B0066" />
+        <register type="NOA" address="0x00009888" value="0x058B0000" />
+        <register type="NOA" address="0x00009888" value="0x038B0000" />
+        <register type="NOA" address="0x00009888" value="0x03844000" />
+        <register type="NOA" address="0x00009888" value="0x47800080" />
+        <register type="NOA" address="0x00009888" value="0x57800000" />
+        <register type="NOA" address="0x001823A4" value="0x00000000" />
+        <register type="NOA" address="0x00009888" value="0x59800000" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002744" value="0x00800000" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002770" value="0x00000004" />
+        <register type="OA" address="0x00002774" value="0x00000000" />
+        <register type="OA" address="0x00002778" value="0x00000003" />
+        <register type="OA" address="0x0000277C" value="0x00000000" />
+        <register type="OA" address="0x00002780" value="0x00000007" />
+        <register type="OA" address="0x00002784" value="0x00000000" />
+        <register type="OA" address="0x00002788" value="0x00100002" />
+        <register type="OA" address="0x0000278C" value="0x0000FFF7" />
+        <register type="OA" address="0x00002790" value="0x00100002" />
+        <register type="OA" address="0x00002794" value="0x0000FFCF" />
+        <register type="OA" address="0x00002798" value="0x00100082" />
+        <register type="OA" address="0x0000279C" value="0x0000FFEF" />
+        <register type="OA" address="0x000027A0" value="0x001000C2" />
+        <register type="OA" address="0x000027A4" value="0x0000FFE7" />
+        <register type="OA" address="0x000027A8" value="0x00100001" />
+        <register type="OA" address="0x000027AC" value="0x0000FFE7" />
+    </register_config>
+  </set>
+
+</metrics>
diff --git a/lib/i915/perf-configs/oa-cnl.xml b/lib/i915/perf-configs/oa-cnl.xml
new file mode 100644
index 00000000..92582656
--- /dev/null
+++ b/lib/i915/perf-configs/oa-cnl.xml
@@ -0,0 +1,10411 @@
+<?xml version="1.0"?>
+<metrics version="1581935520" merge_md5="">
+  <set name="Render Metrics Basic Gen10"
+       mdapi_supported_apis="VK OGL OCL IO BB"
+       underscore_name="render_basic"
+       hw_config_guid="2d975e19-7130-41d2-b06f-79d74f91e7c8"
+       chipset="CNL"
+       symbol_name="RenderBasic"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Misses"
+             description="The total number of L3 misses."
+             data_type="uint64"
+             equation="C 2 READ C 3 READ UADD"
+             underscore_name="l3_misses"
+             units="messages"
+             symbol_name="L3Misses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/TAG"
+             />
+    <counter name="GTI L3 Throughput"
+             description="The total number of GPU memory bytes transferred between L3 caches and GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL"
+             equation="$L3Misses 64 UMUL"
+             underscore_name="gti_l3_throughput"
+             units="bytes"
+             symbol_name="GtiL3Throughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Cache Misses"
+             description="The total number of sampler cache misses in all LODs in all sampler units."
+             data_type="uint64"
+             equation="$SliceMask 1 AND B 4 READ UMUL $SliceMask 1 >> 1 AND B 5 READ UMUL UADD 8 UMUL"
+             underscore_name="sampler_l1_misses"
+             units="messages"
+             symbol_name="SamplerL1Misses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="L3 Sampler Throughput"
+             description="The total number of GPU memory bytes transferred between samplers and L3 caches."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="64 $SamplerL1Misses UMUL"
+             underscore_name="l3_sampler_throughput"
+             units="bytes"
+             symbol_name="L3SamplerThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Sampler"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Sampler00 Busy"
+             description="The percentage of time in which Slice0 Sampler0 has been processing EU requests."
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler00_busy"
+             units="percent"
+             symbol_name="Sampler00Busy"
+             availability="$SubsliceMask 1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_group="Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Sampler10 Busy"
+             description="The percentage of time in which Slice1 Sampler0 has been processing EU requests."
+             data_type="float"
+             max_equation="100"
+             equation="B 1 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler10_busy"
+             units="percent"
+             symbol_name="Sampler10Busy"
+             availability="$SubsliceMask 8 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_group="Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Samplers Busy"
+             description="The percentage of time in which samplers have been processing EU requests."
+             data_type="float"
+             max_equation="100"
+             equation="$SubsliceMask 1 AND $Sampler00Busy FMUL $SubsliceMask 3 >> 1 AND $Sampler10Busy FMUL FADD $SubsliceMask 1 AND $SubsliceMask 3 >> 1 AND FADD FDIV"
+             underscore_name="samplers_busy"
+             units="percent"
+             symbol_name="SamplersBusy"
+             availability="$SubsliceMask 9 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="Sampler"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="GTI Fixed Pipe Throughput"
+             description="The total number of GPU memory bytes transferred between 3D Pipeline (Command Dispatch, Input Assembly and Stream Output) and GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL"
+             equation="C 4 READ C 5 READ UADD 64 UMUL"
+             underscore_name="gti_vf_throughput"
+             units="bytes"
+             symbol_name="GtiVfThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="GTI/3D Pipe"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texel lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="L3 Lookup Accesses w/o IC"
+             description="The total number of L3 cache lookup accesses w/o IC."
+             data_type="uint64"
+             equation="$SamplerL1Misses $ShaderMemoryAccesses UADD"
+             underscore_name="l3_lookups"
+             units="messages"
+             symbol_name="L3Lookups"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/TAG"
+             />
+    <counter name="Sampler00 Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which Slice0 Sampler0 has been slowing down the pipe when processing EU requests."
+             data_type="float"
+             high_watermark="15"
+             equation="B 2 READ 100 UMUL $GpuCoreClocks FDIV"
+             max_equation="100"
+             underscore_name="sampler00_bottleneck"
+             units="percent"
+             symbol_name="Sampler00Bottleneck"
+             availability="$SubsliceMask 1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GTI Read Throughput"
+             description="The total number of GPU memory bytes read from GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL"
+             equation="64  C 6 READ UMUL"
+             underscore_name="gti_read_throughput"
+             units="bytes"
+             symbol_name="GtiReadThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GTI Depth Throughput"
+             description="The total number of GPU memory bytes transferred between depth caches and GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL"
+             equation="128  B 6 READ UMUL"
+             underscore_name="gti_depth_throughput"
+             units="bytes"
+             symbol_name="GtiDepthThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="GTI/Depth Cache"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Sampler10 Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which Slice1 Sampler0 has been slowing down the pipe when processing EU requests."
+             data_type="float"
+             high_watermark="15"
+             equation="B 3 READ 100 UMUL $GpuCoreClocks FDIV"
+             max_equation="100"
+             underscore_name="sampler10_bottleneck"
+             units="percent"
+             symbol_name="Sampler10Bottleneck"
+             availability="$SubsliceMask 8 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Samplers Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which samplers have been slowing down the pipe when processing EU requests."
+             data_type="float"
+             high_watermark="15"
+             equation="$SubsliceMask 1 AND $Sampler00Bottleneck FMUL $SubsliceMask 3 >> 1 AND $Sampler10Bottleneck FMUL FADD $SubsliceMask 1 AND $SubsliceMask 3 >> 1 AND FADD FDIV"
+             max_equation="100"
+             underscore_name="sampler_bottleneck"
+             units="percent"
+             symbol_name="SamplerBottleneck"
+             availability="$SubsliceMask 9 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Indicate System Frame Batch Draw"
+             mdapi_group="Sampler"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="GTI RCC Throughput"
+             description="The total number of GPU memory bytes transferred between render color caches and GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL"
+             equation="C 0 READ C 1 READ UADD 128 UMUL"
+             underscore_name="gti_rcc_throughput"
+             units="bytes"
+             symbol_name="GtiRccThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="GTI/Color Cache"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="GTI Write Throughput"
+             description="The total number of GPU memory bytes written to GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL"
+             equation="64  C 7 READ UMUL"
+             underscore_name="gti_write_throughput"
+             units="bytes"
+             symbol_name="GtiWriteThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ A 31 READ UADD A 32 READ UADD 64 UMUL"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00000D04" value="0x00000200" />
+        <register type="NOA" address="0x00009884" value="0x00000000" />
+        <register type="NOA" address="0x00009888" value="0x146C0008" />
+        <register type="NOA" address="0x00009888" value="0x18110014" />
+        <register type="NOA" address="0x00009888" value="0x14EC0008" />
+        <register type="NOA" address="0x00009888" value="0x18910014" />
+        <register type="NOA" address="0x00009888" value="0x0A6C0054" />
+        <register type="NOA" address="0x00009888" value="0x106C0000" />
+        <register type="NOA" address="0x00009888" value="0x1A6C0444" />
+        <register type="NOA" address="0x00009888" value="0x02738000" />
+        <register type="NOA" address="0x00009888" value="0x0473E000" />
+        <register type="NOA" address="0x00009888" value="0x04742000" />
+        <register type="NOA" address="0x00009888" value="0x0C742000" />
+        <register type="NOA" address="0x00009888" value="0x04752000" />
+        <register type="NOA" address="0x00009888" value="0x0C752000" />
+        <register type="NOA" address="0x00009888" value="0x0C760800" />
+        <register type="NOA" address="0x00009888" value="0x0E760800" />
+        <register type="NOA" address="0x00009888" value="0x0077C000" />
+        <register type="NOA" address="0x00009888" value="0x0E778000" />
+        <register type="NOA" address="0x00009888" value="0x1477C000" />
+        <register type="NOA" address="0x00009888" value="0x167702A0" />
+        <register type="NOA" address="0x00009888" value="0x00194000" />
+        <register type="NOA" address="0x00009888" value="0x1A190020" />
+        <register type="NOA" address="0x00009888" value="0x00110060" />
+        <register type="NOA" address="0x00009888" value="0x08110061" />
+        <register type="NOA" address="0x00009888" value="0x1E110000" />
+        <register type="NOA" address="0x00009888" value="0x10110000" />
+        <register type="NOA" address="0x00009888" value="0x18144000" />
+        <register type="NOA" address="0x00009888" value="0x1C140400" />
+        <register type="NOA" address="0x00009888" value="0x0AEC5400" />
+        <register type="NOA" address="0x00009888" value="0x10EC0000" />
+        <register type="NOA" address="0x00009888" value="0x1AEC0000" />
+        <register type="NOA" address="0x00009888" value="0x04F38000" />
+        <register type="NOA" address="0x00009888" value="0x0AF48000" />
+        <register type="NOA" address="0x00009888" value="0x0CF48000" />
+        <register type="NOA" address="0x00009888" value="0x0AF58000" />
+        <register type="NOA" address="0x00009888" value="0x0CF58000" />
+        <register type="NOA" address="0x00009888" value="0x0EF62200" />
+        <register type="NOA" address="0x00009888" value="0x0EF7C000" />
+        <register type="NOA" address="0x00009888" value="0x16F70230" />
+        <register type="NOA" address="0x00009888" value="0x0E994000" />
+        <register type="NOA" address="0x00009888" value="0x1A990080" />
+        <register type="NOA" address="0x00009888" value="0x06916000" />
+        <register type="NOA" address="0x00009888" value="0x08916100" />
+        <register type="NOA" address="0x00009888" value="0x1E910000" />
+        <register type="NOA" address="0x00009888" value="0x1C941100" />
+        <register type="NOA" address="0x00009884" value="0x00000007" />
+        <register type="NOA" address="0x00009888" value="0x0B086F4F" />
+        <register type="NOA" address="0x00009888" value="0x0D080001" />
+        <register type="NOA" address="0x00009888" value="0x1D073800" />
+        <register type="NOA" address="0x00009888" value="0x1F070140" />
+        <register type="NOA" address="0x00009888" value="0x09081E93" />
+        <register type="NOA" address="0x00009888" value="0x01083160" />
+        <register type="NOA" address="0x00009888" value="0x030801A6" />
+        <register type="NOA" address="0x00009888" value="0x11080000" />
+        <register type="NOA" address="0x00009888" value="0x0F080000" />
+        <register type="NOA" address="0x00009888" value="0x0D095000" />
+        <register type="NOA" address="0x00009888" value="0x0F095000" />
+        <register type="NOA" address="0x00009888" value="0x01094000" />
+        <register type="NOA" address="0x00009888" value="0x03095000" />
+        <register type="NOA" address="0x00009888" value="0x05091000" />
+        <register type="NOA" address="0x00009888" value="0x13040154" />
+        <register type="NOA" address="0x00009888" value="0x09044000" />
+        <register type="NOA" address="0x00009888" value="0x0B045000" />
+        <register type="NOA" address="0x00009888" value="0x0D049000" />
+        <register type="NOA" address="0x00009888" value="0x0F042000" />
+        <register type="NOA" address="0x00009888" value="0x0507E700" />
+        <register type="NOA" address="0x00009888" value="0x070700D7" />
+        <register type="NOA" address="0x00009888" value="0x25070000" />
+        <register type="NOA" address="0x00009888" value="0x1B070000" />
+        <register type="NOA" address="0x00009888" value="0x1100C000" />
+        <register type="NOA" address="0x00009888" value="0x1F00C000" />
+        <register type="NOA" address="0x00009888" value="0x2100C000" />
+        <register type="NOA" address="0x00009888" value="0x2300C000" />
+        <register type="NOA" address="0x00009888" value="0x2500C000" />
+        <register type="NOA" address="0x00009888" value="0x2700C000" />
+        <register type="NOA" address="0x00009888" value="0x29004000" />
+        <register type="NOA" address="0x00009888" value="0x2B004000" />
+        <register type="NOA" address="0x00009888" value="0x2D004000" />
+        <register type="NOA" address="0x00009888" value="0x2F004000" />
+        <register type="NOA" address="0x00009888" value="0x13004000" />
+        <register type="NOA" address="0x00009888" value="0x15004000" />
+        <register type="NOA" address="0x00009888" value="0x17004000" />
+        <register type="NOA" address="0x00009888" value="0x19004000" />
+        <register type="NOA" address="0x00009888" value="0x1B004000" />
+        <register type="NOA" address="0x00009888" value="0x1D004000" />
+        <register type="NOA" address="0x00009888" value="0x47003331" />
+        <register type="NOA" address="0x00009888" value="0x390018C1" />
+        <register type="NOA" address="0x00009888" value="0x49000333" />
+        <register type="NOA" address="0x00009888" value="0x3D000407" />
+        <register type="NOA" address="0x00009888" value="0x4B001101" />
+        <register type="NOA" address="0x00009888" value="0x3F000120" />
+        <register type="NOA" address="0x00009888" value="0x4D003333" />
+        <register type="NOA" address="0x00009888" value="0x410018C6" />
+        <register type="NOA" address="0x00009888" value="0x35000000" />
+        <register type="NOA" address="0x00009888" value="0x31000000" />
+        <register type="NOA" address="0x00009888" value="0x43000006" />
+        <register type="NOA" address="0x00009888" value="0x3B001CC6" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x00800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x40800000" />
+        <register type="OA" address="0x000027A0" value="0x00000202" />
+        <register type="OA" address="0x000027A4" value="0x0000FF3F" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+        <register type="FLEX" address="0x0000E65C" value="0x00222222" />
+    </register_config>
+  </set>
+
+  <set name="Compute Metrics Basic Gen10"
+       mdapi_supported_apis="VK OGL OCL IO BB"
+       underscore_name="compute_basic"
+       hw_config_guid="eed14f91-5f03-4e3a-8281-ac38030ac573"
+       chipset="CNL"
+       symbol_name="ComputeBasic"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Untyped Bytes Read"
+             description="The total number of untyped memory bytes read via Data Port."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="$EuSubslicesTotalCount $SubsliceMask 1 AND C 2 READ FMUL $SubsliceMask 3 >> 1 AND C 3 READ FMUL FADD FMUL $SubsliceMask 1 AND $SubsliceMask 3 >> 1 AND FADD FDIV 64 UMUL"
+             underscore_name="untyped_bytes_read"
+             units="bytes"
+             symbol_name="UntypedBytesRead"
+             availability="$SubsliceMask 9 AND "
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Typed Bytes Written"
+             description="The total number of typed memory bytes written via Data Port."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="$SubsliceMask 1 AND B 5 READ UMUL $SubsliceMask 1 >> 1 AND B 6 READ UMUL UADD $SubsliceMask 2 >> 1 AND B 7 READ UMUL UADD $SubsliceMask 3 >> 1 AND C 0 READ UMUL UADD $SubsliceMask 4 >> 1 AND C 1 READ UMUL UADD 64 UMUL"
+             underscore_name="typed_bytes_written"
+             units="bytes"
+             symbol_name="TypedBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU AVG IPC Rate"
+             description="The average rate of IPC calculated for 2 FPU pipelines."
+             data_type="float"
+             max_equation="2"
+             equation="A 9 READ A 10 READ A 11 READ FADD A 9 READ FSUB FDIV 1 FADD"
+             underscore_name="eu_avg_ipc_rate"
+             units="number"
+             symbol_name="EuAvgIpcRate"
+             semantic_type="ratio"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="EU FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="fpu1_active"
+             units="percent"
+             symbol_name="Fpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="fpu0_active"
+             units="percent"
+             symbol_name="Fpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texel lookups (with 2x2 accuracy) that missed the L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GTI Read Throughput"
+             description="The total number of GPU memory bytes read from GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL"
+             equation="64  C 6 READ UMUL"
+             underscore_name="gti_read_throughput"
+             units="bytes"
+             symbol_name="GtiReadThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Untyped Writes"
+             description="The total number of untyped memory bytes written via Data Port."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="$EuSubslicesTotalCount $SubsliceMask 1 AND C 4 READ FMUL $SubsliceMask 3 >> 1 AND C 5 READ FMUL FADD FMUL $SubsliceMask 1 AND $SubsliceMask 3 >> 1 AND FADD FDIV 64 UMUL"
+             underscore_name="untyped_bytes_written"
+             units="bytes"
+             symbol_name="UntypedBytesWritten"
+             availability="$SubsliceMask 9 AND"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="Typed Bytes Read"
+             description="The total number of typed memory bytes read via Data Port."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="$SubsliceMask 1 AND B 0 READ UMUL $SubsliceMask 1 >> 1 AND B 1 READ UMUL UADD $SubsliceMask 2 >> 1 AND B 2 READ UMUL UADD $SubsliceMask 3 >> 1 AND B 3 READ UMUL UADD $SubsliceMask 4 >> 1 AND B 4 READ UMUL UADD 64 UMUL"
+             underscore_name="typed_bytes_read"
+             units="bytes"
+             symbol_name="TypedBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="EU Thread Occupancy"
+             description="The percentage of time in which hardware threads occupied EUs."
+             data_type="float"
+             max_equation="100"
+             equation="8 A 13 READ FMUL $EuThreadsCount FDIV $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_thread_occupancy"
+             units="percent"
+             symbol_name="EuThreadOccupancy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="GTI Write Throughput"
+             description="The total number of GPU memory bytes written to GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL"
+             equation="64  C 7 READ UMUL"
+             underscore_name="gti_write_throughput"
+             units="bytes"
+             symbol_name="GtiWriteThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ A 31 READ UADD A 32 READ UADD 64 UMUL"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <counter name="EU Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_send_active"
+             units="percent"
+             symbol_name="EuSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00000D04" value="0x00000200" />
+        <register type="NOA" address="0x00009884" value="0x00000000" />
+        <register type="NOA" address="0x00009888" value="0x121A0000" />
+        <register type="NOA" address="0x00009888" value="0x101A0007" />
+        <register type="NOA" address="0x00009888" value="0x123A0000" />
+        <register type="NOA" address="0x00009888" value="0x129A0000" />
+        <register type="NOA" address="0x00009888" value="0x109A0007" />
+        <register type="NOA" address="0x00009888" value="0x12BA0000" />
+        <register type="NOA" address="0x00009888" value="0x125A0000" />
+        <register type="NOA" address="0x00009888" value="0x1A6C0140" />
+        <register type="NOA" address="0x00009888" value="0x1C6C0005" />
+        <register type="NOA" address="0x00009888" value="0x186C0880" />
+        <register type="NOA" address="0x00009888" value="0x04736000" />
+        <register type="NOA" address="0x00009888" value="0x0673C000" />
+        <register type="NOA" address="0x00009888" value="0x00734000" />
+        <register type="NOA" address="0x00009888" value="0x02731000" />
+        <register type="NOA" address="0x00009888" value="0x0474A000" />
+        <register type="NOA" address="0x00009888" value="0x0E748000" />
+        <register type="NOA" address="0x00009888" value="0x06748000" />
+        <register type="NOA" address="0x00009888" value="0x0475A000" />
+        <register type="NOA" address="0x00009888" value="0x0E758000" />
+        <register type="NOA" address="0x00009888" value="0x06758000" />
+        <register type="NOA" address="0x00009888" value="0x0C762800" />
+        <register type="NOA" address="0x00009888" value="0x10760002" />
+        <register type="NOA" address="0x00009888" value="0x0E760002" />
+        <register type="NOA" address="0x00009888" value="0x0077C000" />
+        <register type="NOA" address="0x00009888" value="0x0E774000" />
+        <register type="NOA" address="0x00009888" value="0x14774000" />
+        <register type="NOA" address="0x00009888" value="0x167797A0" />
+        <register type="NOA" address="0x00009888" value="0x18770002" />
+        <register type="NOA" address="0x00009888" value="0x0277C000" />
+        <register type="NOA" address="0x00009888" value="0x04778000" />
+        <register type="NOA" address="0x00009888" value="0x0677C000" />
+        <register type="NOA" address="0x00009888" value="0x08778000" />
+        <register type="NOA" address="0x00009888" value="0x0A7B0A00" />
+        <register type="NOA" address="0x00009888" value="0x0C7B0028" />
+        <register type="NOA" address="0x00009888" value="0x0E7C8000" />
+        <register type="NOA" address="0x00009888" value="0x147C0C00" />
+        <register type="NOA" address="0x00009888" value="0x167C0038" />
+        <register type="NOA" address="0x00009888" value="0x1C7D2000" />
+        <register type="NOA" address="0x00009888" value="0x1E7D0080" />
+        <register type="NOA" address="0x00009888" value="0x0019C000" />
+        <register type="NOA" address="0x00009888" value="0x1A191800" />
+        <register type="NOA" address="0x00009888" value="0x0219C000" />
+        <register type="NOA" address="0x00009888" value="0x0619C000" />
+        <register type="NOA" address="0x00009888" value="0x001A2E52" />
+        <register type="NOA" address="0x00009888" value="0x0A1A2880" />
+        <register type="NOA" address="0x00009888" value="0x021A2D80" />
+        <register type="NOA" address="0x00009888" value="0x0E39C000" />
+        <register type="NOA" address="0x00009888" value="0x1A396000" />
+        <register type="NOA" address="0x00009888" value="0x063A2900" />
+        <register type="NOA" address="0x00009888" value="0x0C3A0051" />
+        <register type="NOA" address="0x00009888" value="0x003A0000" />
+        <register type="NOA" address="0x00009888" value="0x0CF48000" />
+        <register type="NOA" address="0x00009888" value="0x12F40400" />
+        <register type="NOA" address="0x00009888" value="0x06F42000" />
+        <register type="NOA" address="0x00009888" value="0x08F42000" />
+        <register type="NOA" address="0x00009888" value="0x0CF58000" />
+        <register type="NOA" address="0x00009888" value="0x14F50020" />
+        <register type="NOA" address="0x00009888" value="0x06F52000" />
+        <register type="NOA" address="0x00009888" value="0x08F52000" />
+        <register type="NOA" address="0x00009888" value="0x0EF62008" />
+        <register type="NOA" address="0x00009888" value="0x10F60080" />
+        <register type="NOA" address="0x00009888" value="0x0CF68000" />
+        <register type="NOA" address="0x00009888" value="0x16F7C070" />
+        <register type="NOA" address="0x00009888" value="0x18F70001" />
+        <register type="NOA" address="0x00009888" value="0x04F7C000" />
+        <register type="NOA" address="0x00009888" value="0x08F7C000" />
+        <register type="NOA" address="0x00009888" value="0x0AFB8000" />
+        <register type="NOA" address="0x00009888" value="0x0CFB0200" />
+        <register type="NOA" address="0x00009888" value="0x14FC8000" />
+        <register type="NOA" address="0x00009888" value="0x16FC0200" />
+        <register type="NOA" address="0x00009888" value="0x1EFD2008" />
+        <register type="NOA" address="0x00009888" value="0x1A990180" />
+        <register type="NOA" address="0x00009888" value="0x1C99000C" />
+        <register type="NOA" address="0x00009888" value="0x0499C000" />
+        <register type="NOA" address="0x00009888" value="0x0899C000" />
+        <register type="NOA" address="0x00009888" value="0x089A2900" />
+        <register type="NOA" address="0x00009888" value="0x0E9A0051" />
+        <register type="NOA" address="0x00009888" value="0x029A005C" />
+        <register type="NOA" address="0x00009888" value="0x049A005B" />
+        <register type="NOA" address="0x00009888" value="0x009A0000" />
+        <register type="NOA" address="0x00009888" value="0x1AB90600" />
+        <register type="NOA" address="0x00009888" value="0x1CB90030" />
+        <register type="NOA" address="0x00009888" value="0x0ABA0052" />
+        <register type="NOA" address="0x00009888" value="0x0EBA2880" />
+        <register type="NOA" address="0x00009888" value="0x00BA0000" />
+        <register type="NOA" address="0x00009888" value="0x1A590060" />
+        <register type="NOA" address="0x00009888" value="0x1C590003" />
+        <register type="NOA" address="0x00009888" value="0x085A0052" />
+        <register type="NOA" address="0x00009888" value="0x0C5A2880" />
+        <register type="NOA" address="0x00009888" value="0x005A0000" />
+        <register type="NOA" address="0x00009884" value="0x00000007" />
+        <register type="NOA" address="0x00009888" value="0x1D073800" />
+        <register type="NOA" address="0x00009888" value="0x1F070140" />
+        <register type="NOA" address="0x00009888" value="0x0D048000" />
+        <register type="NOA" address="0x00009888" value="0x0F042000" />
+        <register type="NOA" address="0x00009888" value="0x0507E700" />
+        <register type="NOA" address="0x00009888" value="0x070700D7" />
+        <register type="NOA" address="0x00009888" value="0x25070000" />
+        <register type="NOA" address="0x00009888" value="0x1B070000" />
+        <register type="NOA" address="0x00009888" value="0x1100C000" />
+        <register type="NOA" address="0x00009888" value="0x1F00C000" />
+        <register type="NOA" address="0x00009888" value="0x2100C000" />
+        <register type="NOA" address="0x00009888" value="0x2300C000" />
+        <register type="NOA" address="0x00009888" value="0x2500C000" />
+        <register type="NOA" address="0x00009888" value="0x2700C000" />
+        <register type="NOA" address="0x00009888" value="0x2900C000" />
+        <register type="NOA" address="0x00009888" value="0x2B00C000" />
+        <register type="NOA" address="0x00009888" value="0x2D00C000" />
+        <register type="NOA" address="0x00009888" value="0x2F00C000" />
+        <register type="NOA" address="0x00009888" value="0x1300C000" />
+        <register type="NOA" address="0x00009888" value="0x1500C000" />
+        <register type="NOA" address="0x00009888" value="0x1700C000" />
+        <register type="NOA" address="0x00009888" value="0x1900C000" />
+        <register type="NOA" address="0x00009888" value="0x1B004000" />
+        <register type="NOA" address="0x00009888" value="0x1D004000" />
+        <register type="NOA" address="0x00009888" value="0x47001011" />
+        <register type="NOA" address="0x00009888" value="0x39000021" />
+        <register type="NOA" address="0x00009888" value="0x49001330" />
+        <register type="NOA" address="0x00009888" value="0x3D001026" />
+        <register type="NOA" address="0x00009888" value="0x4B001000" />
+        <register type="NOA" address="0x00009888" value="0x3F000400" />
+        <register type="NOA" address="0x00009888" value="0x4D000001" />
+        <register type="NOA" address="0x00009888" value="0x41000081" />
+        <register type="NOA" address="0x00009888" value="0x35000000" />
+        <register type="NOA" address="0x00009888" value="0x31000000" />
+        <register type="NOA" address="0x00009888" value="0x43000000" />
+        <register type="NOA" address="0x00009888" value="0x3B001801" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x00800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00000003" />
+        <register type="FLEX" address="0x0000E658" value="0x00002001" />
+        <register type="FLEX" address="0x0000E758" value="0x00000008" />
+    </register_config>
+  </set>
+
+  <set name="Render Metrics for 3D Pipeline Profile Gen10"
+       mdapi_supported_apis="VK OGL OCL IO BB"
+       underscore_name="render_pipe_profile"
+       hw_config_guid="0666ccac-f5aa-4dc2-aa12-c6e058f383f3"
+       chipset="CNL"
+       symbol_name="RenderPipeProfile"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Bottleneck"
+             low_watermark="10"
+             description="The percentage of time in which vertex shader pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="30"
+             equation="C 3 READ 100 UMUL $GpuCoreClocks FDIV"
+             max_equation="100"
+             underscore_name="vs_bottleneck"
+             units="percent"
+             symbol_name="VsBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Hi-Depth Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which early hierarchical depth test pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="15"
+             equation="B 3 READ 100 UMUL $GpuCoreClocks FDIV"
+             max_equation="100"
+             underscore_name="hi_depth_bottleneck"
+             units="percent"
+             symbol_name="HiDepthBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which geometry shader pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="15"
+             equation="C 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             max_equation="100"
+             underscore_name="gs_bottleneck"
+             units="percent"
+             symbol_name="GsBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Geometry Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="BC Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which barycentric coordinates calculation pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="15"
+             equation="B 2 READ 100 UMUL $GpuCoreClocks FDIV"
+             max_equation="100"
+             underscore_name="bc_bottleneck"
+             units="percent"
+             symbol_name="BcBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Rasterizer/Barycentric Calc"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="HS Stall"
+             description="The percentage of time in which hull shader pipeline stage was stalled."
+             data_type="float"
+             max_equation="100"
+             equation="B 1 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="hs_stall"
+             units="percent"
+             symbol_name="HsStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Correlate Draw"
+             mdapi_group="3D Pipe/Hull Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texel lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="VF Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which vertex fetch pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="15"
+             equation="B 4 READ 100 UMUL $GpuCoreClocks FDIV"
+             max_equation="100"
+             underscore_name="vf_bottleneck"
+             units="percent"
+             symbol_name="VfBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Input Assembler"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Strip-Fans Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which strip-fans pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="10"
+             equation="B 6 READ 100 UMUL $GpuCoreClocks FDIV"
+             max_equation="100"
+             underscore_name="sf_bottleneck"
+             units="percent"
+             symbol_name="SfBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Rasterizer/Strip-Fans"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SF Stall"
+             description="The percentage of time in which strip-fans pipeline stage was stalled."
+             data_type="float"
+             max_equation="100"
+             equation="C 4 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sf_stall"
+             units="percent"
+             symbol_name="SfStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Correlate Draw"
+             mdapi_group="3D Pipe/Rasterizer/Strip-Fans"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="HS Bottleneck"
+             low_watermark="3"
+             description="The percentage of time in which hull shader pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="9"
+             equation="C 2 READ 100 UMUL $GpuCoreClocks FDIV"
+             max_equation="100"
+             underscore_name="hs_bottleneck"
+             units="percent"
+             symbol_name="HsBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Hull Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="CL Stall"
+             description="The percentage of time in which clipper pipeline stage was stalled."
+             data_type="float"
+             max_equation="100"
+             equation="C 5 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="cl_stall"
+             units="percent"
+             symbol_name="ClStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Correlate Draw"
+             mdapi_group="3D Pipe/Clipper"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SO Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which stream output pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="15"
+             equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             max_equation="100"
+             underscore_name="so_bottleneck"
+             units="percent"
+             symbol_name="SoBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Stream Output"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="DS Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which domain shader pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="15"
+             equation="C 1 READ 100 UMUL $GpuCoreClocks FDIV"
+             max_equation="100"
+             underscore_name="ds_bottleneck"
+             units="percent"
+             symbol_name="DsBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Domain Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Clipper Bottleneck"
+             low_watermark="10"
+             description="The percentage of time in which clipper pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="30"
+             equation="B 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             max_equation="100"
+             underscore_name="cl_bottleneck"
+             units="percent"
+             symbol_name="ClBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Clipper"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Stall"
+             description="The percentage of time in which domain shader pipeline stage was stalled."
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ds_stall"
+             units="percent"
+             symbol_name="DsStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Correlate Draw"
+             mdapi_group="3D Pipe/Domain Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Early Depth Bottleneck"
+             low_watermark="10"
+             description="The percentage of time in which early depth test pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="30"
+             equation="B 5 READ 100 UMUL $GpuCoreClocks FDIV"
+             max_equation="100"
+             underscore_name="early_depth_bottleneck"
+             units="percent"
+             symbol_name="EarlyDepthBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ A 31 READ UADD A 32 READ UADD 64 UMUL"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SO Stall"
+             description="The percentage of time in which stream-output pipeline stage was stalled."
+             data_type="float"
+             max_equation="100"
+             equation="C 6 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="so_stall"
+             units="percent"
+             symbol_name="SoStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Correlate Draw"
+             mdapi_group="3D Pipe/Stream Output"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00000D04" value="0x00000200" />
+        <register type="NOA" address="0x00009884" value="0x00000000" />
+        <register type="NOA" address="0x00009888" value="0x0A7003E0" />
+        <register type="NOA" address="0x00009888" value="0x0A710000" />
+        <register type="NOA" address="0x00009888" value="0x1017001E" />
+        <register type="NOA" address="0x00009888" value="0x06700015" />
+        <register type="NOA" address="0x00009888" value="0x00700000" />
+        <register type="NOA" address="0x00009888" value="0x06710800" />
+        <register type="NOA" address="0x00009888" value="0x00710000" />
+        <register type="NOA" address="0x00009888" value="0x0C746000" />
+        <register type="NOA" address="0x00009888" value="0x0C75A000" />
+        <register type="NOA" address="0x00009888" value="0x0E754000" />
+        <register type="NOA" address="0x00009888" value="0x0E762800" />
+        <register type="NOA" address="0x00009888" value="0x10760002" />
+        <register type="NOA" address="0x00009888" value="0x1477C000" />
+        <register type="NOA" address="0x00009888" value="0x16770330" />
+        <register type="NOA" address="0x00009888" value="0x1A190040" />
+        <register type="NOA" address="0x00009888" value="0x08170001" />
+        <register type="NOA" address="0x00009888" value="0x1C170000" />
+        <register type="NOA" address="0x00009884" value="0x00000007" />
+        <register type="NOA" address="0x00009888" value="0x01160031" />
+        <register type="NOA" address="0x00009888" value="0x11177C00" />
+        <register type="NOA" address="0x00009888" value="0x11187C00" />
+        <register type="NOA" address="0x00009888" value="0x05190000" />
+        <register type="NOA" address="0x00009888" value="0x110E7800" />
+        <register type="NOA" address="0x00009888" value="0x130F0000" />
+        <register type="NOA" address="0x00009888" value="0x15120000" />
+        <register type="NOA" address="0x00009888" value="0x11130019" />
+        <register type="NOA" address="0x00009888" value="0x0F160C80" />
+        <register type="NOA" address="0x00009888" value="0x0B160000" />
+        <register type="NOA" address="0x00009888" value="0x07162000" />
+        <register type="NOA" address="0x00009888" value="0x03168000" />
+        <register type="NOA" address="0x00009888" value="0x071705C0" />
+        <register type="NOA" address="0x00009888" value="0x011704C0" />
+        <register type="NOA" address="0x00009888" value="0x05170000" />
+        <register type="NOA" address="0x00009888" value="0x0B180015" />
+        <register type="NOA" address="0x00009888" value="0x01185000" />
+        <register type="NOA" address="0x00009888" value="0x07185000" />
+        <register type="NOA" address="0x00009888" value="0x0D185000" />
+        <register type="NOA" address="0x00009888" value="0x0F185000" />
+        <register type="NOA" address="0x00009888" value="0x03186000" />
+        <register type="NOA" address="0x00009888" value="0x05185000" />
+        <register type="NOA" address="0x00009888" value="0x03190022" />
+        <register type="NOA" address="0x00009888" value="0x0F190000" />
+        <register type="NOA" address="0x00009888" value="0x09190000" />
+        <register type="NOA" address="0x00009888" value="0x0D0E8023" />
+        <register type="NOA" address="0x00009888" value="0x030E1100" />
+        <register type="NOA" address="0x00009888" value="0x050E4000" />
+        <register type="NOA" address="0x00009888" value="0x0D0F0180" />
+        <register type="NOA" address="0x00009888" value="0x050F0001" />
+        <register type="NOA" address="0x00009888" value="0x010F0000" />
+        <register type="NOA" address="0x00009888" value="0x1B100054" />
+        <register type="NOA" address="0x00009888" value="0x07104000" />
+        <register type="NOA" address="0x00009888" value="0x09104000" />
+        <register type="NOA" address="0x00009888" value="0x0B104000" />
+        <register type="NOA" address="0x00009888" value="0x0D104000" />
+        <register type="NOA" address="0x00009888" value="0x1B114000" />
+        <register type="NOA" address="0x00009888" value="0x1D110006" />
+        <register type="NOA" address="0x00009888" value="0x07118000" />
+        <register type="NOA" address="0x00009888" value="0x09118000" />
+        <register type="NOA" address="0x00009888" value="0x0B114000" />
+        <register type="NOA" address="0x00009888" value="0x0D114000" />
+        <register type="NOA" address="0x00009888" value="0x05127100" />
+        <register type="NOA" address="0x00009888" value="0x07120073" />
+        <register type="NOA" address="0x00009888" value="0x21120001" />
+        <register type="NOA" address="0x00009888" value="0x1F120000" />
+        <register type="NOA" address="0x00009888" value="0x0F130002" />
+        <register type="NOA" address="0x00009888" value="0x01130000" />
+        <register type="NOA" address="0x00009888" value="0x0B144000" />
+        <register type="NOA" address="0x00009888" value="0x0F144025" />
+        <register type="NOA" address="0x00009888" value="0x11140025" />
+        <register type="NOA" address="0x00009888" value="0x0D145200" />
+        <register type="NOA" address="0x00009888" value="0x11158000" />
+        <register type="NOA" address="0x00009888" value="0x1F158080" />
+        <register type="NOA" address="0x00009888" value="0x13158000" />
+        <register type="NOA" address="0x00009888" value="0x0109A000" />
+        <register type="NOA" address="0x00009888" value="0x0709A000" />
+        <register type="NOA" address="0x00009888" value="0x0B092000" />
+        <register type="NOA" address="0x00009888" value="0x0D09A000" />
+        <register type="NOA" address="0x00009888" value="0x0F09A000" />
+        <register type="NOA" address="0x00009888" value="0x0309A000" />
+        <register type="NOA" address="0x00009888" value="0x0509A000" />
+        <register type="NOA" address="0x00009888" value="0x010BC000" />
+        <register type="NOA" address="0x00009888" value="0x070BC000" />
+        <register type="NOA" address="0x00009888" value="0x0B0B4000" />
+        <register type="NOA" address="0x00009888" value="0x0D0BC000" />
+        <register type="NOA" address="0x00009888" value="0x0F0BC000" />
+        <register type="NOA" address="0x00009888" value="0x030BC000" />
+        <register type="NOA" address="0x00009888" value="0x050BC000" />
+        <register type="NOA" address="0x00009888" value="0x09045000" />
+        <register type="NOA" address="0x00009888" value="0x0F045000" />
+        <register type="NOA" address="0x00009888" value="0x11044000" />
+        <register type="NOA" address="0x00009888" value="0x13040154" />
+        <register type="NOA" address="0x00009888" value="0x0B045000" />
+        <register type="NOA" address="0x00009888" value="0x0D045000" />
+        <register type="NOA" address="0x00009888" value="0x11004000" />
+        <register type="NOA" address="0x00009888" value="0x1F004000" />
+        <register type="NOA" address="0x00009888" value="0x2100C000" />
+        <register type="NOA" address="0x00009888" value="0x2300C000" />
+        <register type="NOA" address="0x00009888" value="0x25004000" />
+        <register type="NOA" address="0x00009888" value="0x2700C000" />
+        <register type="NOA" address="0x00009888" value="0x29004000" />
+        <register type="NOA" address="0x00009888" value="0x2B004000" />
+        <register type="NOA" address="0x00009888" value="0x2D004000" />
+        <register type="NOA" address="0x00009888" value="0x2F004000" />
+        <register type="NOA" address="0x00009888" value="0x13004000" />
+        <register type="NOA" address="0x00009888" value="0x15004000" />
+        <register type="NOA" address="0x00009888" value="0x17004000" />
+        <register type="NOA" address="0x00009888" value="0x19004000" />
+        <register type="NOA" address="0x00009888" value="0x1B004000" />
+        <register type="NOA" address="0x00009888" value="0x1D004000" />
+        <register type="NOA" address="0x00009888" value="0x47001111" />
+        <register type="NOA" address="0x00009888" value="0x39001022" />
+        <register type="NOA" address="0x00009888" value="0x49001111" />
+        <register type="NOA" address="0x00009888" value="0x3D000021" />
+        <register type="NOA" address="0x00009888" value="0x4B000100" />
+        <register type="NOA" address="0x00009888" value="0x3F0018A5" />
+        <register type="NOA" address="0x00009888" value="0x4D001111" />
+        <register type="NOA" address="0x00009888" value="0x41000001" />
+        <register type="NOA" address="0x00009888" value="0x35000000" />
+        <register type="NOA" address="0x00009888" value="0x31000000" />
+        <register type="NOA" address="0x00009888" value="0x43000002" />
+        <register type="NOA" address="0x00009888" value="0x3B000401" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x00800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+    </register_config>
+  </set>
+
+  <set name="Memory Reads Distribution Gen10"
+       mdapi_supported_apis="VK OGL OCL IO BB"
+       underscore_name="memory_reads"
+       hw_config_guid="3500dcfd-837b-4ec8-b5cf-fe58b966263f"
+       chipset="CNL"
+       symbol_name="MemoryReads"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GtiL3Bank0Reads"
+             description="The total number of GTI memory reads from L3 Bank 0 (L3 Cache misses)."
+             data_type="uint64"
+             equation="C 1 READ"
+             underscore_name="gti_l3_bank0_reads"
+             units="messages"
+             symbol_name="GtiL3Bank0Reads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/L3"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="GtiRingAccesses"
+             description="The total number of all accesses from GTI to the ring."
+             data_type="uint64"
+             equation="C 7 READ"
+             underscore_name="gti_ring_accesses"
+             units="messages"
+             symbol_name="GtiRingAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="GtiRsMemoryReads"
+             description="The total number of GTI memory reads from Resource Streamer."
+             data_type="uint64"
+             equation="B 2 READ"
+             underscore_name="gti_rs_memory_reads"
+             units="messages"
+             symbol_name="GtiRsMemoryReads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/3D Pipe/Resource Streamer"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GtiHizMemoryReads"
+             description="The total number of GTI memory reads from Hierarchical Depth Cache (Hi-Depth Cache misses)."
+             data_type="uint64"
+             equation="B 5 READ"
+             underscore_name="gti_hiz_memory_reads"
+             units="messages"
+             symbol_name="GtiHizMemoryReads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Depth Cache"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="GtiRccMemoryReads"
+             description="The total number of GTI memory reads from Render Color Cache (Render Color Cache misses)."
+             data_type="uint64"
+             equation="B 3 READ"
+             underscore_name="gti_rcc_memory_reads"
+             units="messages"
+             symbol_name="GtiRccMemoryReads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Color Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GtiL3Bank1Reads"
+             description="The total number of GTI memory reads from L3 Bank 1 (L3 Cache misses)."
+             data_type="uint64"
+             equation="C 2 READ"
+             underscore_name="gti_l3_bank1_reads"
+             units="messages"
+             symbol_name="GtiL3Bank1Reads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="GTI/L3"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GtiCmdStreamerMemoryReads"
+             description="The total number of GTI memory reads from Command Streamer."
+             data_type="uint64"
+             equation="B 0 READ"
+             underscore_name="gti_cmd_streamer_memory_reads"
+             units="messages"
+             symbol_name="GtiCmdStreamerMemoryReads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/3D Pipe/Command Streamer"
+             />
+    <counter name="GtiL3Bank2Reads"
+             description="The total number of GTI memory reads from L3 Bank 2 (L3 Cache misses)."
+             data_type="uint64"
+             equation="C 3 READ"
+             underscore_name="gti_l3_bank2_reads"
+             units="messages"
+             symbol_name="GtiL3Bank2Reads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="GTI/L3"
+             />
+    <counter name="GtiMemoryReads"
+             description="The total number of GTI memory reads."
+             data_type="uint64"
+             equation="C 0 READ"
+             underscore_name="gti_memory_reads"
+             units="messages"
+             symbol_name="GtiMemoryReads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="GtiRczMemoryReads"
+             description="The total number of GTI memory reads from Render Depth Cache (Render Depth Cache misses)."
+             data_type="uint64"
+             equation="B 7 READ"
+             underscore_name="gti_rcz_memory_reads"
+             units="messages"
+             symbol_name="GtiRczMemoryReads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Depth Cache"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="GtiMscMemoryReads"
+             description="The total number of GTI memory reads from Multisampling Color Cache (Multisampling Color Cache misses)."
+             data_type="uint64"
+             equation="B 4 READ"
+             underscore_name="gti_msc_memory_reads"
+             units="messages"
+             symbol_name="GtiMscMemoryReads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Color Cache"
+             />
+    <counter name="GtiVfMemoryReads"
+             description="The total number of GTI memory reads from Vertex Fetch."
+             data_type="uint64"
+             equation="B 1 READ"
+             underscore_name="gti_vf_memory_reads"
+             units="messages"
+             symbol_name="GtiVfMemoryReads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/3D Pipe/Vertex Fetch"
+             />
+    <counter name="GtiStcMemoryReads"
+             description="The total number of GTI memory reads from Stencil Cache (Stencil Cache misses)."
+             data_type="uint64"
+             equation="B 6 READ"
+             underscore_name="gti_stc_memory_reads"
+             units="messages"
+             symbol_name="GtiStcMemoryReads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Depth Cache"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GtiL3Reads"
+             description="The total number of GTI memory reads from L3 (L3 Cache misses)."
+             data_type="uint64"
+             equation="$GtiL3Bank0Reads $GtiL3Bank1Reads UADD $GtiL3Bank2Reads UADD"
+             underscore_name="gti_l3_reads"
+             units="messages"
+             symbol_name="GtiL3Reads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/L3"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00000D04" value="0x00000200" />
+        <register type="NOA" address="0x00009884" value="0x00000007" />
+        <register type="NOA" address="0x00009888" value="0x17066860" />
+        <register type="NOA" address="0x00009888" value="0x15070017" />
+        <register type="NOA" address="0x00009888" value="0x1F072920" />
+        <register type="NOA" address="0x00009888" value="0x1B038000" />
+        <register type="NOA" address="0x00009888" value="0x0D038000" />
+        <register type="NOA" address="0x00009888" value="0x0F034000" />
+        <register type="NOA" address="0x00009888" value="0x0F063180" />
+        <register type="NOA" address="0x00009888" value="0x01063100" />
+        <register type="NOA" address="0x00009888" value="0x0306006B" />
+        <register type="NOA" address="0x00009888" value="0x05060000" />
+        <register type="NOA" address="0x00009888" value="0x11080100" />
+        <register type="NOA" address="0x00009888" value="0x0D085000" />
+        <register type="NOA" address="0x00009888" value="0x0F094000" />
+        <register type="NOA" address="0x00009888" value="0x01094000" />
+        <register type="NOA" address="0x00009888" value="0x03091000" />
+        <register type="NOA" address="0x00009888" value="0x09046000" />
+        <register type="NOA" address="0x00009888" value="0x0F04A000" />
+        <register type="NOA" address="0x00009888" value="0x1104A800" />
+        <register type="NOA" address="0x00009888" value="0x130401AA" />
+        <register type="NOA" address="0x00009888" value="0x0B041000" />
+        <register type="NOA" address="0x00009888" value="0x010700E0" />
+        <register type="NOA" address="0x00009888" value="0x0707E153" />
+        <register type="NOA" address="0x00009888" value="0x0907E3E2" />
+        <register type="NOA" address="0x00009888" value="0x0B07E5E4" />
+        <register type="NOA" address="0x00009888" value="0x0D07E7E6" />
+        <register type="NOA" address="0x00009888" value="0x0F0700EF" />
+        <register type="NOA" address="0x00009888" value="0x25070000" />
+        <register type="NOA" address="0x00009888" value="0x11070000" />
+        <register type="NOA" address="0x00009888" value="0x23070000" />
+        <register type="NOA" address="0x00009888" value="0x1D070000" />
+        <register type="NOA" address="0x00009888" value="0x11004000" />
+        <register type="NOA" address="0x00009888" value="0x1F004000" />
+        <register type="NOA" address="0x00009888" value="0x21004000" />
+        <register type="NOA" address="0x00009888" value="0x23004000" />
+        <register type="NOA" address="0x00009888" value="0x25004000" />
+        <register type="NOA" address="0x00009888" value="0x27004000" />
+        <register type="NOA" address="0x00009888" value="0x29004000" />
+        <register type="NOA" address="0x00009888" value="0x2B004000" />
+        <register type="NOA" address="0x00009888" value="0x2D004000" />
+        <register type="NOA" address="0x00009888" value="0x2F004000" />
+        <register type="NOA" address="0x00009888" value="0x13004000" />
+        <register type="NOA" address="0x00009888" value="0x15004000" />
+        <register type="NOA" address="0x00009888" value="0x1D004000" />
+        <register type="NOA" address="0x00009888" value="0x47000000" />
+        <register type="NOA" address="0x00009888" value="0x39000003" />
+        <register type="NOA" address="0x00009888" value="0x49000000" />
+        <register type="NOA" address="0x00009888" value="0x3D000C63" />
+        <register type="NOA" address="0x00009888" value="0x4B000000" />
+        <register type="NOA" address="0x00009888" value="0x3F000C63" />
+        <register type="NOA" address="0x00009888" value="0x4D000000" />
+        <register type="NOA" address="0x00009888" value="0x41000C63" />
+        <register type="NOA" address="0x00009888" value="0x35000000" />
+        <register type="NOA" address="0x00009888" value="0x31000000" />
+        <register type="NOA" address="0x00009888" value="0x43000000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0xF0800000" />
+        <register type="OA" address="0x00002770" value="0x0000081A" />
+        <register type="OA" address="0x00002774" value="0x0000FE00" />
+        <register type="OA" address="0x00002778" value="0x0000082A" />
+        <register type="OA" address="0x0000277C" value="0x0000FE00" />
+        <register type="OA" address="0x00002780" value="0x00000872" />
+        <register type="OA" address="0x00002784" value="0x0000FE00" />
+        <register type="OA" address="0x00002788" value="0x000008BA" />
+        <register type="OA" address="0x0000278C" value="0x0000FE00" />
+        <register type="OA" address="0x00002790" value="0x0000087A" />
+        <register type="OA" address="0x00002794" value="0x0000FE00" />
+        <register type="OA" address="0x00002798" value="0x000008EA" />
+        <register type="OA" address="0x0000279C" value="0x0000FE00" />
+        <register type="OA" address="0x000027A0" value="0x000008E2" />
+        <register type="OA" address="0x000027A4" value="0x0000FE00" />
+        <register type="OA" address="0x000027A8" value="0x000008F2" />
+        <register type="OA" address="0x000027AC" value="0x0000FE00" />
+        <register type="OA" address="0x0000274C" value="0x86543210" />
+        <register type="OA" address="0x00002744" value="0x00006667" />
+        <register type="OA" address="0x00002748" value="0x86543210" />
+        <register type="OA" address="0x0000275C" value="0x86543210" />
+        <register type="OA" address="0x00002754" value="0x00000065" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+    </register_config>
+  </set>
+
+  <set name="Memory Writes Distribution Gen10"
+       mdapi_supported_apis="VK OGL OCL IO BB"
+       underscore_name="memory_writes"
+       hw_config_guid="63d18ead-3cfc-4972-a640-5e98b688dfee"
+       chipset="CNL"
+       symbol_name="MemoryWrites"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GtiMemoryWrites"
+             description="The total number of GTI memory writes."
+             data_type="uint64"
+             equation="C 0 READ"
+             underscore_name="gti_memory_writes"
+             units="messages"
+             symbol_name="GtiMemoryWrites"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="GtiRingAccesses"
+             description="The total number of all accesses from GTI to the ring."
+             data_type="uint64"
+             equation="C 7 READ"
+             underscore_name="gti_ring_accesses"
+             units="messages"
+             symbol_name="GtiRingAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="GtiMscMemoryWrites"
+             description="The total number of GTI memory writes from Multisampling Color Cache (Multisampling Color Cache invalidations)."
+             data_type="uint64"
+             equation="B 3 READ"
+             underscore_name="gti_msc_memory_writes"
+             units="messages"
+             symbol_name="GtiMscMemoryWrites"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Color Cache"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="GtiCmdStreamerMemoryWrites"
+             description="The total number of GTI memory writes from Command Streamer."
+             data_type="uint64"
+             equation="B 0 READ"
+             underscore_name="gti_cmd_streamer_memory_writes"
+             units="messages"
+             symbol_name="GtiCmdStreamerMemoryWrites"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/3D Pipe/Command Streamer"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GtiL3Bank0Writes"
+             description="The total number of GTI memory writes from L3 Bank 0 (L3 Bank 0 invalidations)."
+             data_type="uint64"
+             equation="C 1 READ"
+             underscore_name="gti_l3_bank0_writes"
+             units="messages"
+             symbol_name="GtiL3Bank0Writes"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/L3"
+             />
+    <counter name="GtiL3Bank1Writes"
+             description="The total number of GTI memory writes from L3 Bank 1 (L3 Bank 1 invalidations)."
+             data_type="uint64"
+             equation="C 2 READ"
+             underscore_name="gti_l3_bank1_writes"
+             units="messages"
+             symbol_name="GtiL3Bank1Writes"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/L3"
+             />
+    <counter name="GtiL3Bank2Writes"
+             description="The total number of GTI memory writes from L3 Bank 2 (L3 Bank 2 invalidations)."
+             data_type="uint64"
+             equation="C 3 READ"
+             underscore_name="gti_l3_bank2_writes"
+             units="messages"
+             symbol_name="GtiL3Bank2Writes"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/L3"
+             />
+    <counter name="GtiL3Writes"
+             description="The total number of GTI memory writes from L3 (L3 invalidations)."
+             data_type="uint64"
+             equation="$GtiL3Bank0Writes $GtiL3Bank1Writes UADD $GtiL3Bank2Writes UADD"
+             underscore_name="gti_l3_writes"
+             units="messages"
+             symbol_name="GtiL3Writes"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/L3"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GtiRccMemoryWrites"
+             description="The total number of GTI memory writes from Render Color Cache (Render Color Cache invalidations)."
+             data_type="uint64"
+             equation="B 2 READ"
+             underscore_name="gti_rcc_memory_writes"
+             units="messages"
+             symbol_name="GtiRccMemoryWrites"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Color Cache"
+             />
+    <counter name="GtiSoMemoryWrites"
+             description="The total number of GTI memory writes from Stream Output."
+             data_type="uint64"
+             equation="B 1 READ"
+             underscore_name="gti_so_memory_writes"
+             units="messages"
+             symbol_name="GtiSoMemoryWrites"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/3D Pipe/Stream Output"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GtiStcMemoryWrites"
+             description="The total number of GTI memory writes from Stencil Cache."
+             data_type="uint64"
+             equation="B 5 READ"
+             underscore_name="gti_stc_memory_writes"
+             units="messages"
+             symbol_name="GtiStcMemoryWrites"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Depth Cache"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="GtiRczMemoryWrites"
+             description="The total number of GTI memory writes from Render Depth Cache."
+             data_type="uint64"
+             equation="B 6 READ"
+             underscore_name="gti_rcz_memory_writes"
+             units="messages"
+             symbol_name="GtiRczMemoryWrites"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Depth Cache"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ A 31 READ UADD A 32 READ UADD 64 UMUL"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GtiHizMemoryWrites"
+             description="The total number of GTI memory writes from Hierarchical Depth Cache."
+             data_type="uint64"
+             equation="B 4 READ"
+             underscore_name="gti_hiz_memory_writes"
+             units="messages"
+             symbol_name="GtiHizMemoryWrites"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Depth Cache"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00000D04" value="0x00000200" />
+        <register type="NOA" address="0x00009884" value="0x00000007" />
+        <register type="NOA" address="0x00009888" value="0x17066860" />
+        <register type="NOA" address="0x00009888" value="0x15070017" />
+        <register type="NOA" address="0x00009888" value="0x1D073C00" />
+        <register type="NOA" address="0x00009888" value="0x1F07000E" />
+        <register type="NOA" address="0x00009888" value="0x1B038000" />
+        <register type="NOA" address="0x00009888" value="0x0D038000" />
+        <register type="NOA" address="0x00009888" value="0x0F034000" />
+        <register type="NOA" address="0x00009888" value="0x0F063180" />
+        <register type="NOA" address="0x00009888" value="0x01063100" />
+        <register type="NOA" address="0x00009888" value="0x0306006B" />
+        <register type="NOA" address="0x00009888" value="0x05060000" />
+        <register type="NOA" address="0x00009888" value="0x11080100" />
+        <register type="NOA" address="0x00009888" value="0x0D085000" />
+        <register type="NOA" address="0x00009888" value="0x0F094000" />
+        <register type="NOA" address="0x00009888" value="0x01094000" />
+        <register type="NOA" address="0x00009888" value="0x03091000" />
+        <register type="NOA" address="0x00009888" value="0x09046000" />
+        <register type="NOA" address="0x00009888" value="0x0F04A000" />
+        <register type="NOA" address="0x00009888" value="0x1104A800" />
+        <register type="NOA" address="0x00009888" value="0x130401AA" />
+        <register type="NOA" address="0x00009888" value="0x0B041000" />
+        <register type="NOA" address="0x00009888" value="0x010700D0" />
+        <register type="NOA" address="0x00009888" value="0x0707D153" />
+        <register type="NOA" address="0x00009888" value="0x0907D3D2" />
+        <register type="NOA" address="0x00009888" value="0x0B07D5D4" />
+        <register type="NOA" address="0x00009888" value="0x0D07D7D6" />
+        <register type="NOA" address="0x00009888" value="0x0F0700DF" />
+        <register type="NOA" address="0x00009888" value="0x25070000" />
+        <register type="NOA" address="0x00009888" value="0x11070000" />
+        <register type="NOA" address="0x00009888" value="0x23070000" />
+        <register type="NOA" address="0x00009888" value="0x11004000" />
+        <register type="NOA" address="0x00009888" value="0x1F004000" />
+        <register type="NOA" address="0x00009888" value="0x21004000" />
+        <register type="NOA" address="0x00009888" value="0x23004000" />
+        <register type="NOA" address="0x00009888" value="0x25004000" />
+        <register type="NOA" address="0x00009888" value="0x27004000" />
+        <register type="NOA" address="0x00009888" value="0x29004000" />
+        <register type="NOA" address="0x00009888" value="0x2B004000" />
+        <register type="NOA" address="0x00009888" value="0x2D004000" />
+        <register type="NOA" address="0x00009888" value="0x2F004000" />
+        <register type="NOA" address="0x00009888" value="0x13004000" />
+        <register type="NOA" address="0x00009888" value="0x15004000" />
+        <register type="NOA" address="0x00009888" value="0x1D004000" />
+        <register type="NOA" address="0x00009888" value="0x47000000" />
+        <register type="NOA" address="0x00009888" value="0x39000003" />
+        <register type="NOA" address="0x00009888" value="0x49000000" />
+        <register type="NOA" address="0x00009888" value="0x3D000C63" />
+        <register type="NOA" address="0x00009888" value="0x4B000000" />
+        <register type="NOA" address="0x00009888" value="0x3F000C63" />
+        <register type="NOA" address="0x00009888" value="0x4D000000" />
+        <register type="NOA" address="0x00009888" value="0x41000C63" />
+        <register type="NOA" address="0x00009888" value="0x35000000" />
+        <register type="NOA" address="0x00009888" value="0x31000000" />
+        <register type="NOA" address="0x00009888" value="0x43000000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x70800000" />
+        <register type="OA" address="0x00002770" value="0x0000081A" />
+        <register type="OA" address="0x00002774" value="0x0000FE00" />
+        <register type="OA" address="0x00002778" value="0x00000822" />
+        <register type="OA" address="0x0000277C" value="0x0000FE00" />
+        <register type="OA" address="0x00002780" value="0x000008BA" />
+        <register type="OA" address="0x00002784" value="0x0000FE00" />
+        <register type="OA" address="0x00002788" value="0x0000087A" />
+        <register type="OA" address="0x0000278C" value="0x0000FE00" />
+        <register type="OA" address="0x00002790" value="0x000008EA" />
+        <register type="OA" address="0x00002794" value="0x0000FE00" />
+        <register type="OA" address="0x00002798" value="0x000008E2" />
+        <register type="OA" address="0x0000279C" value="0x0000FE00" />
+        <register type="OA" address="0x000027A0" value="0x000008F2" />
+        <register type="OA" address="0x000027A4" value="0x0000FE00" />
+        <register type="OA" address="0x0000274C" value="0x65432108" />
+        <register type="OA" address="0x00002744" value="0x0000CCCE" />
+        <register type="OA" address="0x00002748" value="0x65432108" />
+        <register type="OA" address="0x0000275C" value="0x65432108" />
+        <register type="OA" address="0x00002754" value="0x000000CA" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+    </register_config>
+  </set>
+
+  <set name="Compute Metrics Extended Gen10"
+       mdapi_supported_apis="VK OGL OCL IO BB"
+       underscore_name="compute_extended"
+       hw_config_guid="1b4d1280-6bbd-4d57-90c6-a03ed6059688"
+       chipset="CNL"
+       symbol_name="ComputeExtended"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU AVG IPC Rate"
+             description="The average rate of IPC calculated for 2 FPU pipelines."
+             data_type="float"
+             max_equation="2"
+             equation="A 9 READ A 10 READ A 11 READ FADD A 9 READ FSUB FDIV 1 FADD"
+             underscore_name="eu_avg_ipc_rate"
+             units="number"
+             symbol_name="EuAvgIpcRate"
+             semantic_type="ratio"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Typed Writes 0"
+             description="The subslice 0 typed writes."
+             data_type="uint64"
+             equation="C 4 READ"
+             underscore_name="typed_writes0"
+             units="messages"
+             symbol_name="TypedWrites0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="EuTypedAtomics0"
+             description="The subslice 0 EU Typed Atomics."
+             data_type="uint64"
+             equation="B 7 READ"
+             underscore_name="eu_typed_atomics0"
+             units="messages"
+             symbol_name="EuTypedAtomics0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="Typed Atomics 0"
+             description="The subslice 0 typed atomics."
+             data_type="uint64"
+             equation="C 5 READ"
+             underscore_name="typed_atomics0"
+             units="messages"
+             symbol_name="TypedAtomics0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="TypedAtomicsPerCacheLine"
+             description="The ratio of EU typed atomics requests to L3 cache line writes."
+             data_type="float"
+             equation="$EuTypedAtomics0 $TypedAtomics0 FDIV"
+             underscore_name="typed_atomics_per_cache_line"
+             units="eu sends to l3 cache lines"
+             symbol_name="TypedAtomicsPerCacheLine"
+             semantic_type="ratio"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="EuUntypedReads0"
+             description="The subslice 0 EU Untyped Reads."
+             data_type="uint64"
+             equation="B 0 READ"
+             underscore_name="eu_untyped_reads0"
+             units="messages"
+             symbol_name="EuUntypedReads0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="Untyped Writes 0"
+             description="The subslice 0 untyped writes (including SLM writes)."
+             data_type="uint64"
+             equation="C 2 READ"
+             underscore_name="untyped_writes0"
+             units="messages"
+             symbol_name="UntypedWrites0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="EU FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="fpu1_active"
+             units="percent"
+             symbol_name="Fpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="fpu0_active"
+             units="percent"
+             symbol_name="Fpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EuUntypedAtomics0"
+             description="The subslice 0 EU Untyped Atomics."
+             data_type="uint64"
+             equation="B 2 READ"
+             underscore_name="eu_untyped_atomics0"
+             units="messages"
+             symbol_name="EuUntypedAtomics0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="EuUntypedWrites0"
+             description="The subslice 0 EU Untyped Writes."
+             data_type="uint64"
+             equation="B 1 READ"
+             underscore_name="eu_untyped_writes0"
+             units="messages"
+             symbol_name="EuUntypedWrites0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="EuA64UntypedWrites0"
+             description="The subslice 0 EU A64 Untyped Writes."
+             data_type="uint64"
+             equation="B 4 READ"
+             underscore_name="eu_a64_untyped_writes0"
+             units="messages"
+             symbol_name="EuA64UntypedWrites0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="UntypedWritesPerCacheLine"
+             description="The ratio of EU untyped write requests to L3 cache line writes."
+             data_type="float"
+             equation="$EuUntypedWrites0 $EuA64UntypedWrites0 FADD $UntypedWrites0 FDIV"
+             underscore_name="untyped_writes_per_cache_line"
+             units="eu sends to l3 cache lines"
+             symbol_name="UntypedWritesPerCacheLine"
+             semantic_type="ratio"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texel lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EuTypedWrites0"
+             description="The subslice 0 EU Typed Writes."
+             data_type="uint64"
+             equation="B 6 READ"
+             underscore_name="eu_typed_writes0"
+             units="messages"
+             symbol_name="EuTypedWrites0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="TypedWritesPerCacheLine"
+             description="The ratio of EU typed write requests to L3 cache line writes."
+             data_type="float"
+             equation="$EuTypedWrites0 $TypedWrites0 FDIV"
+             underscore_name="typed_writes_per_cache_line"
+             units="eu sends to l3 cache lines"
+             symbol_name="TypedWritesPerCacheLine"
+             semantic_type="ratio"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="Typed Reads 0"
+             description="The subslice 0 typed reads."
+             data_type="uint64"
+             equation="C 3 READ"
+             underscore_name="typed_reads0"
+             units="messages"
+             symbol_name="TypedReads0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="Untyped Reads 0"
+             description="The subslice 0 untyped reads (including SLM reads)."
+             data_type="uint64"
+             equation="C 1 READ"
+             underscore_name="untyped_reads0"
+             units="messages"
+             symbol_name="UntypedReads0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="EuA64UntypedReads0"
+             description="The subslice 0 EU A64 untyped reads."
+             data_type="uint64"
+             equation="B 3 READ"
+             underscore_name="eu_a64_untyped_reads0"
+             units="messages"
+             symbol_name="EuA64UntypedReads0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="EU Thread Occupancy"
+             description="The percentage of time in which hardware threads occupied EUs."
+             data_type="float"
+             max_equation="100"
+             equation="8 A 13 READ FMUL $EuThreadsCount FDIV $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_thread_occupancy"
+             units="percent"
+             symbol_name="EuThreadOccupancy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EuTypedReads0"
+             description="The subslice 0 EU typed reads."
+             data_type="uint64"
+             equation="B 5 READ"
+             underscore_name="eu_typed_reads0"
+             units="messages"
+             symbol_name="EuTypedReads0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="UntypedReadsPerCacheLine"
+             description="The ratio of EU untyped read requests to L3 cache line reads."
+             data_type="float"
+             equation="$EuUntypedReads0 $EuA64UntypedReads0 FADD $UntypedReads0 FDIV"
+             underscore_name="untyped_reads_per_cache_line"
+             units="eu sends to l3 cache lines"
+             symbol_name="UntypedReadsPerCacheLine"
+             semantic_type="ratio"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="TypedReadsPerCacheLine"
+             description="The ratio of EU typed read requests to L3 cache line reads."
+             data_type="float"
+             equation="$EuTypedReads0 $TypedReads0 FDIV"
+             underscore_name="typed_reads_per_cache_line"
+             units="eu sends to l3 cache lines"
+             symbol_name="TypedReadsPerCacheLine"
+             semantic_type="ratio"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ A 31 READ UADD A 32 READ UADD 64 UMUL"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <counter name="EU Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_send_active"
+             units="percent"
+             symbol_name="EuSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <register_config type="NOA"
+                     availability="$SubsliceMask 1 AND"
+                     priority="0"
+                     >
+        <register type="NOA" address="0x00000D04" value="0x00000200" />
+        <register type="NOA" address="0x00009884" value="0x00000000" />
+        <register type="NOA" address="0x00009888" value="0x121A0007" />
+        <register type="NOA" address="0x00009888" value="0x101A0000" />
+        <register type="NOA" address="0x00009888" value="0x121B000B" />
+        <register type="NOA" address="0x00009888" value="0x161B0009" />
+        <register type="NOA" address="0x00009888" value="0x0474A000" />
+        <register type="NOA" address="0x00009888" value="0x0A748000" />
+        <register type="NOA" address="0x00009888" value="0x0C74A000" />
+        <register type="NOA" address="0x00009888" value="0x0E74A000" />
+        <register type="NOA" address="0x00009888" value="0x12741540" />
+        <register type="NOA" address="0x00009888" value="0x0674A000" />
+        <register type="NOA" address="0x00009888" value="0x08742000" />
+        <register type="NOA" address="0x00009888" value="0x0475A000" />
+        <register type="NOA" address="0x00009888" value="0x0A758000" />
+        <register type="NOA" address="0x00009888" value="0x0C75A000" />
+        <register type="NOA" address="0x00009888" value="0x0E75A000" />
+        <register type="NOA" address="0x00009888" value="0x147500AA" />
+        <register type="NOA" address="0x00009888" value="0x0675A000" />
+        <register type="NOA" address="0x00009888" value="0x08752000" />
+        <register type="NOA" address="0x00009888" value="0x0C76A800" />
+        <register type="NOA" address="0x00009888" value="0x0E76AA0A" />
+        <register type="NOA" address="0x00009888" value="0x107602AA" />
+        <register type="NOA" address="0x00009888" value="0x0077C000" />
+        <register type="NOA" address="0x00009888" value="0x0E77C000" />
+        <register type="NOA" address="0x00009888" value="0x1477C000" />
+        <register type="NOA" address="0x00009888" value="0x1677FFF0" />
+        <register type="NOA" address="0x00009888" value="0x18770003" />
+        <register type="NOA" address="0x00009888" value="0x0277C000" />
+        <register type="NOA" address="0x00009888" value="0x0477C000" />
+        <register type="NOA" address="0x00009888" value="0x0677C000" />
+        <register type="NOA" address="0x00009888" value="0x0877C000" />
+        <register type="NOA" address="0x00009888" value="0x00198000" />
+        <register type="NOA" address="0x00009888" value="0x0E198000" />
+        <register type="NOA" address="0x00009888" value="0x1A195540" />
+        <register type="NOA" address="0x00009888" value="0x1C19003A" />
+        <register type="NOA" address="0x00009888" value="0x0219C000" />
+        <register type="NOA" address="0x00009888" value="0x0419C000" />
+        <register type="NOA" address="0x00009888" value="0x0619C000" />
+        <register type="NOA" address="0x00009888" value="0x0819C000" />
+        <register type="NOA" address="0x00009888" value="0x0E1A2A00" />
+        <register type="NOA" address="0x00009888" value="0x001A2980" />
+        <register type="NOA" address="0x00009888" value="0x021A2CDA" />
+        <register type="NOA" address="0x00009888" value="0x041A0058" />
+        <register type="NOA" address="0x00009888" value="0x001B0011" />
+        <register type="NOA" address="0x00009888" value="0x061B0900" />
+        <register type="NOA" address="0x00009888" value="0x081B0A13" />
+        <register type="NOA" address="0x00009888" value="0x0A1B0B15" />
+        <register type="NOA" address="0x00009888" value="0x0C1B2317" />
+        <register type="NOA" address="0x00009888" value="0x0E1B0043" />
+        <register type="NOA" address="0x00009888" value="0x101B0000" />
+        <register type="NOA" address="0x00009888" value="0x10178000" />
+        <register type="NOA" address="0x00009888" value="0x1C1701FE" />
+        <register type="NOA" address="0x00009884" value="0x00000007" />
+        <register type="NOA" address="0x00009888" value="0x1100C000" />
+        <register type="NOA" address="0x00009888" value="0x1F00C000" />
+        <register type="NOA" address="0x00009888" value="0x2100C000" />
+        <register type="NOA" address="0x00009888" value="0x2300C000" />
+        <register type="NOA" address="0x00009888" value="0x2500C000" />
+        <register type="NOA" address="0x00009888" value="0x2700C000" />
+        <register type="NOA" address="0x00009888" value="0x2900C000" />
+        <register type="NOA" address="0x00009888" value="0x2B00C000" />
+        <register type="NOA" address="0x00009888" value="0x2D00C000" />
+        <register type="NOA" address="0x00009888" value="0x2F00C000" />
+        <register type="NOA" address="0x00009888" value="0x1300C000" />
+        <register type="NOA" address="0x00009888" value="0x1500C000" />
+        <register type="NOA" address="0x00009888" value="0x1700C000" />
+        <register type="NOA" address="0x00009888" value="0x1900C000" />
+        <register type="NOA" address="0x00009888" value="0x47000000" />
+        <register type="NOA" address="0x00009888" value="0x39000420" />
+        <register type="NOA" address="0x00009888" value="0x49000000" />
+        <register type="NOA" address="0x00009888" value="0x3D000000" />
+        <register type="NOA" address="0x00009888" value="0x4B000000" />
+        <register type="NOA" address="0x00009888" value="0x3F000000" />
+        <register type="NOA" address="0x00009888" value="0x4D000000" />
+        <register type="NOA" address="0x00009888" value="0x41000000" />
+        <register type="NOA" address="0x00009888" value="0x35000000" />
+        <register type="NOA" address="0x00009888" value="0x31000000" />
+        <register type="NOA" address="0x00009888" value="0x43000001" />
+        <register type="NOA" address="0x00009888" value="0x3B000021" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0xF0800000" />
+        <register type="OA" address="0x00002770" value="0x00000C2A" />
+        <register type="OA" address="0x00002774" value="0x0000FE00" />
+        <register type="OA" address="0x00002778" value="0x00000C6A" />
+        <register type="OA" address="0x0000277C" value="0x0000FE00" />
+        <register type="OA" address="0x00002780" value="0x00000C32" />
+        <register type="OA" address="0x00002784" value="0x0000FE00" />
+        <register type="OA" address="0x00002788" value="0x00000E6A" />
+        <register type="OA" address="0x0000278C" value="0x0000FE00" />
+        <register type="OA" address="0x00002790" value="0x00000E7A" />
+        <register type="OA" address="0x00002794" value="0x0000FE00" />
+        <register type="OA" address="0x00002798" value="0x00000C92" />
+        <register type="OA" address="0x0000279C" value="0x0000FE00" />
+        <register type="OA" address="0x000027A0" value="0x00000CA2" />
+        <register type="OA" address="0x000027A4" value="0x0000FE00" />
+        <register type="OA" address="0x000027A8" value="0x00000C9A" />
+        <register type="OA" address="0x000027AC" value="0x0000FE00" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00000003" />
+        <register type="FLEX" address="0x0000E658" value="0x00002001" />
+        <register type="FLEX" address="0x0000E758" value="0x00000008" />
+    </register_config>
+  </set>
+
+  <set name="Compute Metrics L3 Cache Gen10"
+       mdapi_supported_apis="VK OGL OCL IO BB"
+       underscore_name="compute_l3_cache"
+       hw_config_guid="f3b31b5a-00b3-4fb4-81fd-6446e505534c"
+       chipset="CNL"
+       symbol_name="ComputeL3Cache"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Misses"
+             description="The total number of L3 misses."
+             data_type="uint64"
+             equation="C 2 READ C 3 READ UADD"
+             underscore_name="l3_misses"
+             units="messages"
+             symbol_name="L3Misses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/TAG"
+             />
+    <counter name="GTI L3 Throughput"
+             description="The total number of GPU memory bytes transferred between L3 caches and GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL"
+             equation="$L3Misses 64 UMUL"
+             underscore_name="gti_l3_throughput"
+             units="bytes"
+             symbol_name="GtiL3Throughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 L3 Bank0 Accesses"
+             description="The total number of accesses to Slice0 L3 Bank0."
+             data_type="uint64"
+             equation="B 0 READ 2 UMUL"
+             underscore_name="l3_bank00_accesses"
+             units="messages"
+             symbol_name="L3Bank00Accesses"
+             availability="$SliceMask 1 AND"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="slice"
+             mdapi_group="L3"
+             />
+    <counter name="Slice0 L3 Bank1 Accesses"
+             description="The total number of accesses to Slice0 L3 Bank1."
+             data_type="uint64"
+             equation="B 1 READ 2 UMUL"
+             underscore_name="l3_bank01_accesses"
+             units="messages"
+             symbol_name="L3Bank01Accesses"
+             availability="$SliceMask 1 AND"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="slice"
+             mdapi_group="L3"
+             />
+    <counter name="Slice0 L3 Bank2 Accesses"
+             description="The total number of accesses to Slice0 L3 Bank2."
+             data_type="uint64"
+             equation="B 2 READ 2 UMUL"
+             underscore_name="l3_bank02_accesses"
+             units="messages"
+             symbol_name="L3Bank02Accesses"
+             availability="$SliceMask 1 AND"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="slice"
+             mdapi_group="L3"
+             />
+    <counter name="Slice1 L3 Bank0 Accesses"
+             description="The total number of accesses to Slice1 L3 Bank0."
+             data_type="uint64"
+             equation="B 3 READ 2 UMUL"
+             underscore_name="l3_bank10_accesses"
+             units="messages"
+             symbol_name="L3Bank10Accesses"
+             availability="$SliceMask 2 AND"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="slice"
+             mdapi_group="L3"
+             />
+    <counter name="Slice1 L3 Bank1 Accesses"
+             description="The total number of accesses to Slice1 L3 Bank1."
+             data_type="uint64"
+             equation="B 4 READ 2 UMUL"
+             underscore_name="l3_bank11_accesses"
+             units="messages"
+             symbol_name="L3Bank11Accesses"
+             availability="$SliceMask 2 AND"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="slice"
+             mdapi_group="L3"
+             />
+    <counter name="Slice1 L3 Bank2 Accesses"
+             description="The total number of accesses to Slice1 L3 Bank2."
+             data_type="uint64"
+             equation="B 5 READ 2 UMUL"
+             underscore_name="l3_bank12_accesses"
+             units="messages"
+             symbol_name="L3Bank12Accesses"
+             availability="$SliceMask 2 AND"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="slice"
+             mdapi_group="L3"
+             />
+    <counter name="L3 Accesses"
+             description="The total number of L3 accesses from all entities."
+             data_type="uint64"
+             equation="$L3Bank00Accesses $L3Bank01Accesses UADD $L3Bank02Accesses UADD $L3Bank10Accesses UADD $L3Bank11Accesses UADD $L3Bank12Accesses UADD"
+             underscore_name="l3_accesses"
+             units="messages"
+             symbol_name="L3Accesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Sampler Throughput"
+             description="The total number of GPU memory bytes transferred between samplers and L3 caches."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="64  $SliceMask 1 AND C 4 READ UMUL $SliceMask 1 >> 1 AND C 5 READ UMUL UADD 8 UMUL UMUL"
+             underscore_name="l3_sampler_throughput"
+             units="bytes"
+             symbol_name="L3SamplerThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Sampler"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU AVG IPC Rate"
+             description="The average rate of IPC calculated for 2 FPU pipelines."
+             data_type="float"
+             max_equation="2"
+             equation="A 9 READ A 10 READ A 11 READ FADD A 9 READ FSUB FDIV 1 FADD"
+             underscore_name="eu_avg_ipc_rate"
+             units="number"
+             symbol_name="EuAvgIpcRate"
+             semantic_type="ratio"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU0 Binary Instruction"
+             description="The percentage of time in which execution units were actively processing binary instructions on FPU0."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_binary_fpu0_instruction"
+             units="percent"
+             symbol_name="EuBinaryFpu0Instruction"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes/Instructions"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="EU FPU0 Hybrid Instruction"
+             description="The percentage of time in which execution units were actively processing hybrid instructions on FPU0."
+             data_type="float"
+             max_equation="100"
+             equation="A 13 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_hybrid_fpu0_instruction"
+             units="percent"
+             symbol_name="EuHybridFpu0Instruction"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="EU Array/Pipes/Instructions"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="fpu1_active"
+             units="percent"
+             symbol_name="Fpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="fpu0_active"
+             units="percent"
+             symbol_name="Fpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="EU FPU0 Move Instruction"
+             description="The percentage of time in which execution units were actively processing move instructions on FPU0."
+             data_type="float"
+             max_equation="100"
+             equation="A 19 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_move_fpu0_instruction"
+             units="percent"
+             symbol_name="EuMoveFpu0Instruction"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes/Instructions"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Accesses"
+             description="The total number of messages sent to samplers."
+             data_type="uint64"
+             equation="A 28 READ"
+             underscore_name="sampler_accesses"
+             units="messages"
+             symbol_name="SamplerAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="$SamplerAccesses 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU FPU1 Hybrid Instruction"
+             description="The percentage of time in which execution units were actively processing hybrid instructions on FPU1."
+             data_type="float"
+             max_equation="100"
+             equation="A 14 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_hybrid_fpu1_instruction"
+             units="percent"
+             symbol_name="EuHybridFpu1Instruction"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="EU Array/Pipes/Instructions"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texel lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="L3 Lookup Accesses w/o IC"
+             description="The total number of L3 cache lookup accesses w/o IC."
+             data_type="uint64"
+             equation="$SliceMask 1 AND C 4 READ UMUL $SliceMask 1 >> 1 AND C 5 READ UMUL UADD 8 UMUL A 32 READ UADD"
+             underscore_name="l3_lookups"
+             units="messages"
+             symbol_name="L3Lookups"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/TAG"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GTI Read Throughput"
+             description="The total number of GPU memory bytes read from GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL"
+             equation="64  C 6 READ UMUL"
+             underscore_name="gti_read_throughput"
+             units="bytes"
+             symbol_name="GtiReadThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU0 Ternary Instruction"
+             description="The percentage of time in which execution units were actively processing ternary instructions on FPU0."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_ternary_fpu0_instruction"
+             units="percent"
+             symbol_name="EuTernaryFpu0Instruction"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes/Instructions"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU FPU1 Move Instruction"
+             description="The percentage of time in which execution units were actively processing move instructions on FPU1."
+             data_type="float"
+             max_equation="100"
+             equation="A 20 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_move_fpu1_instruction"
+             units="percent"
+             symbol_name="EuMoveFpu1Instruction"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes/Instructions"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="L3 Total Throughput"
+             description="The total number of GPU memory bytes transferred via L3."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="$L3Accesses 64 UMUL"
+             underscore_name="l3_total_throughput"
+             units="bytes"
+             symbol_name="L3TotalThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GTI Write Throughput"
+             description="The total number of GPU memory bytes written to GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL"
+             equation="64  C 7 READ UMUL"
+             underscore_name="gti_write_throughput"
+             units="bytes"
+             symbol_name="GtiWriteThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ A 31 READ UADD A 32 READ UADD 64 UMUL"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU1 Binary Instruction"
+             description="The percentage of time in which execution units were actively processing binary instructions on FPU1."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_binary_fpu1_instruction"
+             units="percent"
+             symbol_name="EuBinaryFpu1Instruction"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes/Instructions"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU1 Ternary Instruction"
+             description="The percentage of time in which execution units were actively processing ternary instructions on FPU1."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_ternary_fpu1_instruction"
+             units="percent"
+             symbol_name="EuTernaryFpu1Instruction"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes/Instructions"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_send_active"
+             units="percent"
+             symbol_name="EuSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00000D04" value="0x00000200" />
+        <register type="NOA" address="0x00009884" value="0x00000000" />
+        <register type="NOA" address="0x00009888" value="0x146C0080" />
+        <register type="NOA" address="0x00009888" value="0x14EC0080" />
+        <register type="NOA" address="0x00009888" value="0x006C0050" />
+        <register type="NOA" address="0x00009888" value="0x066C5100" />
+        <register type="NOA" address="0x00009888" value="0x086C0052" />
+        <register type="NOA" address="0x00009888" value="0x026C5C00" />
+        <register type="NOA" address="0x00009888" value="0x106C0000" />
+        <register type="NOA" address="0x00009888" value="0x186C0800" />
+        <register type="NOA" address="0x00009888" value="0x1A6C0540" />
+        <register type="NOA" address="0x00009888" value="0x00739000" />
+        <register type="NOA" address="0x00009888" value="0x02739000" />
+        <register type="NOA" address="0x00009888" value="0x0473F000" />
+        <register type="NOA" address="0x00009888" value="0x00778000" />
+        <register type="NOA" address="0x00009888" value="0x0E778000" />
+        <register type="NOA" address="0x00009888" value="0x14778000" />
+        <register type="NOA" address="0x00009888" value="0x167702A0" />
+        <register type="NOA" address="0x00009888" value="0x06778000" />
+        <register type="NOA" address="0x00009888" value="0x08778000" />
+        <register type="NOA" address="0x00009888" value="0x08EC5000" />
+        <register type="NOA" address="0x00009888" value="0x0AEC5251" />
+        <register type="NOA" address="0x00009888" value="0x04EC005C" />
+        <register type="NOA" address="0x00009888" value="0x10EC0000" />
+        <register type="NOA" address="0x00009888" value="0x1AEC0000" />
+        <register type="NOA" address="0x00009888" value="0x18EC0000" />
+        <register type="NOA" address="0x00009888" value="0x04F3E000" />
+        <register type="NOA" address="0x00009888" value="0x02F31000" />
+        <register type="NOA" address="0x00009888" value="0x16F702A0" />
+        <register type="NOA" address="0x00009888" value="0x08F78000" />
+        <register type="NOA" address="0x00009884" value="0x00000007" />
+        <register type="NOA" address="0x00009888" value="0x0B080360" />
+        <register type="NOA" address="0x00009888" value="0x1D073800" />
+        <register type="NOA" address="0x00009888" value="0x1F070140" />
+        <register type="NOA" address="0x00009888" value="0x01081060" />
+        <register type="NOA" address="0x00009888" value="0x0D080000" />
+        <register type="NOA" address="0x00009888" value="0x01094000" />
+        <register type="NOA" address="0x00009888" value="0x03091000" />
+        <register type="NOA" address="0x00009888" value="0x09044000" />
+        <register type="NOA" address="0x00009888" value="0x0B041000" />
+        <register type="NOA" address="0x00009888" value="0x0D048000" />
+        <register type="NOA" address="0x00009888" value="0x0F042000" />
+        <register type="NOA" address="0x00009888" value="0x0507E700" />
+        <register type="NOA" address="0x00009888" value="0x070700D7" />
+        <register type="NOA" address="0x00009888" value="0x25070000" />
+        <register type="NOA" address="0x00009888" value="0x1B070000" />
+        <register type="NOA" address="0x00009888" value="0x1100C000" />
+        <register type="NOA" address="0x00009888" value="0x1F00C000" />
+        <register type="NOA" address="0x00009888" value="0x2100C000" />
+        <register type="NOA" address="0x00009888" value="0x2300C000" />
+        <register type="NOA" address="0x00009888" value="0x2500C000" />
+        <register type="NOA" address="0x00009888" value="0x2700C000" />
+        <register type="NOA" address="0x00009888" value="0x13004000" />
+        <register type="NOA" address="0x00009888" value="0x15004000" />
+        <register type="NOA" address="0x00009888" value="0x1700C000" />
+        <register type="NOA" address="0x00009888" value="0x1900C000" />
+        <register type="NOA" address="0x00009888" value="0x1B004000" />
+        <register type="NOA" address="0x00009888" value="0x1D004000" />
+        <register type="NOA" address="0x00009888" value="0x47001111" />
+        <register type="NOA" address="0x00009888" value="0x39002101" />
+        <register type="NOA" address="0x00009888" value="0x49001110" />
+        <register type="NOA" address="0x00009888" value="0x3D000429" />
+        <register type="NOA" address="0x00009888" value="0x4B000001" />
+        <register type="NOA" address="0x00009888" value="0x3F000000" />
+        <register type="NOA" address="0x00009888" value="0x35000000" />
+        <register type="NOA" address="0x00009888" value="0x31000000" />
+        <register type="NOA" address="0x00009888" value="0x3B002401" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x00800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00000003" />
+        <register type="FLEX" address="0x0000E658" value="0x00002001" />
+        <register type="FLEX" address="0x0000E758" value="0x00101100" />
+        <register type="FLEX" address="0x0000E45C" value="0x00201200" />
+        <register type="FLEX" address="0x0000E55C" value="0x00301300" />
+        <register type="FLEX" address="0x0000E65C" value="0x00401400" />
+    </register_config>
+  </set>
+
+  <set name="Metric set HDCAndSF"
+       mdapi_supported_apis="VK OGL OCL IO BB"
+       underscore_name="hdc_and_sf"
+       hw_config_guid="890094c5-8615-4f69-a8b9-706c5bcbd713"
+       chipset="CNL"
+       symbol_name="HDCAndSF"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SQ is full"
+             description="The percentage of time when SQ is filled above a threshold (usually 48 entries)"
+             data_type="float"
+             max_equation="100"
+             equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gt_request_queue_full"
+             units="percent"
+             symbol_name="GTRequestQueueFull"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="Polygon Data Ready"
+             description="The percentage of time in which geometry pipeline output is ready"
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="poly_data_ready"
+             units="percent"
+             symbol_name="PolyDataReady"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/3D Pipe/Strip-Fans"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="Slice0 Subslice1 Non-sampler Shader Access Stalled On L3"
+             description="Percentage of time when HDC has messages to L3, but it's stalled due to lack of credits (Slice0 Subslice1)"
+             data_type="float"
+             max_equation="100"
+             equation="B 4 READ B 5 READ FSUB 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="non_sampler_shader01_access_stalled_on_l3"
+             units="percent"
+             symbol_name="NonSamplerShader01AccessStalledOnL3"
+             availability="$SubsliceMask 2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="GPU/Data Port"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="Slice0 Subslice2 Non-sampler Shader Access Stalled On L3"
+             description="Percentage of time when HDC has messages to L3, but it's stalled due to lack of credits (Slice0 Subslice2)"
+             data_type="float"
+             max_equation="100"
+             equation="B 6 READ B 7 READ FSUB 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="non_sampler_shader02_access_stalled_on_l3"
+             units="percent"
+             symbol_name="NonSamplerShader02AccessStalledOnL3"
+             availability="$SubsliceMask 4 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="GPU/Data Port"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice1 Subslice0 Non-sampler Shader Access Stalled On L3"
+             description="Percentage of time when HDC has messages to L3, but it's stalled due to lack of credits (Slice1 Subslice0)"
+             data_type="float"
+             max_equation="100"
+             equation="C 0 READ C 1 READ FSUB 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="non_sampler_shader10_access_stalled_on_l3"
+             units="percent"
+             symbol_name="NonSamplerShader10AccessStalledOnL3"
+             availability="$SubsliceMask 8 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="GPU/Data Port"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="Slice1 Subslice1 Non-sampler Shader Access Stalled On L3"
+             description="Percentage of time when HDC has messages to L3, but it's stalled due to lack of credits (Slice1 Subslice1)"
+             data_type="float"
+             max_equation="100"
+             equation="C 2 READ C 3 READ FSUB 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="non_sampler_shader11_access_stalled_on_l3"
+             units="percent"
+             symbol_name="NonSamplerShader11AccessStalledOnL3"
+             availability="$SubsliceMask 16 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="GPU/Data Port"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ A 31 READ UADD A 32 READ UADD 64 UMUL"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="Slice0 Subslice0 Non-sampler Shader Access Stalled On L3"
+             description="Percentage of time when HDC has messages to L3, but it's stalled due to lack of credits (Slice0 Subslice0)"
+             data_type="float"
+             max_equation="100"
+             equation="B 2 READ B 3 READ FSUB 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="non_sampler_shader00_access_stalled_on_l3"
+             units="percent"
+             symbol_name="NonSamplerShader00AccessStalledOnL3"
+             availability="$SubsliceMask 1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="GPU/Data Port"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00000D04" value="0x00000200" />
+        <register type="NOA" address="0x00009884" value="0x00000000" />
+        <register type="NOA" address="0x00009888" value="0x121A0011" />
+        <register type="NOA" address="0x00009888" value="0x123A0011" />
+        <register type="NOA" address="0x00009888" value="0x129A0011" />
+        <register type="NOA" address="0x00009888" value="0x12BA0011" />
+        <register type="NOA" address="0x00009888" value="0x125A0011" />
+        <register type="NOA" address="0x00009888" value="0x1C6C0005" />
+        <register type="NOA" address="0x00009888" value="0x186C00A0" />
+        <register type="NOA" address="0x00009888" value="0x0673C000" />
+        <register type="NOA" address="0x00009888" value="0x00736000" />
+        <register type="NOA" address="0x00009888" value="0x0C74A000" />
+        <register type="NOA" address="0x00009888" value="0x0C75A000" />
+        <register type="NOA" address="0x00009888" value="0x0E762800" />
+        <register type="NOA" address="0x00009888" value="0x1477C000" />
+        <register type="NOA" address="0x00009888" value="0x16779570" />
+        <register type="NOA" address="0x00009888" value="0x18770002" />
+        <register type="NOA" address="0x00009888" value="0x02778000" />
+        <register type="NOA" address="0x00009888" value="0x04778000" />
+        <register type="NOA" address="0x00009888" value="0x0A7B8000" />
+        <register type="NOA" address="0x00009888" value="0x0C7B002A" />
+        <register type="NOA" address="0x00009888" value="0x147C8000" />
+        <register type="NOA" address="0x00009888" value="0x167C003E" />
+        <register type="NOA" address="0x00009888" value="0x1E7D0028" />
+        <register type="NOA" address="0x00009888" value="0x1A1901E0" />
+        <register type="NOA" address="0x00009888" value="0x081A2B50" />
+        <register type="NOA" address="0x00009888" value="0x001A0000" />
+        <register type="NOA" address="0x00009888" value="0x1A391E00" />
+        <register type="NOA" address="0x00009888" value="0x0A3A2B50" />
+        <register type="NOA" address="0x00009888" value="0x003A0000" />
+        <register type="NOA" address="0x00009888" value="0x12F41400" />
+        <register type="NOA" address="0x00009888" value="0x14F500A0" />
+        <register type="NOA" address="0x00009888" value="0x10F60280" />
+        <register type="NOA" address="0x00009888" value="0x16F7C000" />
+        <register type="NOA" address="0x00009888" value="0x18F70003" />
+        <register type="NOA" address="0x00009888" value="0x02F74000" />
+        <register type="NOA" address="0x00009888" value="0x04F74000" />
+        <register type="NOA" address="0x00009888" value="0x08FBA000" />
+        <register type="NOA" address="0x00009888" value="0x02FC8000" />
+        <register type="NOA" address="0x00009888" value="0x04FC8000" />
+        <register type="NOA" address="0x00009888" value="0x1CFD000A" />
+        <register type="NOA" address="0x00009888" value="0x1C99003C" />
+        <register type="NOA" address="0x00009888" value="0x0E9A2B50" />
+        <register type="NOA" address="0x00009888" value="0x009A0000" />
+        <register type="NOA" address="0x00009888" value="0x02B9C000" />
+        <register type="NOA" address="0x00009888" value="0x04B9C000" />
+        <register type="NOA" address="0x00009888" value="0x00BA2800" />
+        <register type="NOA" address="0x00009888" value="0x02BA0056" />
+        <register type="NOA" address="0x00009888" value="0x1A596000" />
+        <register type="NOA" address="0x00009888" value="0x1C590003" />
+        <register type="NOA" address="0x00009888" value="0x0C5A2B50" />
+        <register type="NOA" address="0x00009888" value="0x005A0000" />
+        <register type="NOA" address="0x00009884" value="0x00000007" />
+        <register type="NOA" address="0x00009888" value="0x130E03C0" />
+        <register type="NOA" address="0x00009888" value="0x2100F000" />
+        <register type="NOA" address="0x00009888" value="0x01181000" />
+        <register type="NOA" address="0x00009888" value="0x010E0030" />
+        <register type="NOA" address="0x00009888" value="0x110E0000" />
+        <register type="NOA" address="0x00009888" value="0x01104000" />
+        <register type="NOA" address="0x00009888" value="0x01118000" />
+        <register type="NOA" address="0x00009888" value="0x0B142000" />
+        <register type="NOA" address="0x00009888" value="0x01092000" />
+        <register type="NOA" address="0x00009888" value="0x010B4000" />
+        <register type="NOA" address="0x00009888" value="0x09041000" />
+        <register type="NOA" address="0x00009888" value="0x1D000071" />
+        <register type="NOA" address="0x00009888" value="0x33000000" />
+        <register type="NOA" address="0x00009888" value="0x11004000" />
+        <register type="NOA" address="0x00009888" value="0x2300C000" />
+        <register type="NOA" address="0x00009888" value="0x2500C000" />
+        <register type="NOA" address="0x00009888" value="0x2700C000" />
+        <register type="NOA" address="0x00009888" value="0x2900C000" />
+        <register type="NOA" address="0x00009888" value="0x2B00C000" />
+        <register type="NOA" address="0x00009888" value="0x2D00C000" />
+        <register type="NOA" address="0x00009888" value="0x2F00C000" />
+        <register type="NOA" address="0x00009888" value="0x1300C000" />
+        <register type="NOA" address="0x00009888" value="0x1500C000" />
+        <register type="NOA" address="0x00009888" value="0x47000003" />
+        <register type="NOA" address="0x00009888" value="0x39000000" />
+        <register type="NOA" address="0x00009888" value="0x4B001111" />
+        <register type="NOA" address="0x00009888" value="0x3D000408" />
+        <register type="NOA" address="0x00009888" value="0x3F000421" />
+        <register type="NOA" address="0x00009888" value="0x4D000000" />
+        <register type="NOA" address="0x00009888" value="0x41000084" />
+        <register type="NOA" address="0x00009888" value="0x35000000" />
+        <register type="NOA" address="0x00009888" value="0x31000000" />
+        <register type="NOA" address="0x00009888" value="0x43000000" />
+        <register type="NOA" address="0x00009888" value="0x49000300" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x10800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+        <register type="OA" address="0x00002770" value="0x00000002" />
+        <register type="OA" address="0x00002774" value="0x0000FFFE" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+    </register_config>
+  </set>
+
+  <set name="Metric set L3_1"
+       mdapi_supported_apis="VK OGL OCL IO BB"
+       underscore_name="l3_1"
+       hw_config_guid="e56f7dd7-ff55-4bae-89a1-a526a2e3b0d6"
+       chipset="CNL"
+       symbol_name="L3_1"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 L3 Bank1 Active"
+             description="The percentage of time in which slice0 L3 bank1 is active"
+             data_type="float"
+             max_equation="100"
+             equation="C 4 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l30_bank1_active"
+             units="percent"
+             symbol_name="L30Bank1Active"
+             availability="$SliceMask 1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SQ is full"
+             description="The percentage of time when SQ is filled above a threshold (usually 48 entries)"
+             data_type="float"
+             max_equation="100"
+             equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gt_request_queue_full"
+             units="percent"
+             symbol_name="GTRequestQueueFull"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on the both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="Slice0 L3 Bank1 Stalled"
+             description="The percentage of time in which slice0 L3 bank1 is stalled"
+             data_type="float"
+             max_equation="100"
+             equation="B 1 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l30_bank1_stalled"
+             units="percent"
+             symbol_name="L30Bank1Stalled"
+             availability="$SliceMask 1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 L3 Bank2 Active"
+             description="The percentage of time in which slice0 L3 bank2 is active"
+             data_type="float"
+             max_equation="100"
+             equation="C 5 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l30_bank2_active"
+             units="percent"
+             symbol_name="L30Bank2Active"
+             availability="$SliceMask 1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Slice0 L3 Bank0 Active"
+             description="The percentage of time in which slice0 L3 bank0 is active"
+             data_type="float"
+             max_equation="100"
+             equation="C 3 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l30_bank0_active"
+             units="percent"
+             symbol_name="L30Bank0Active"
+             availability="$SliceMask 1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="Slice1 L3 Bank2 Stalled"
+             description="The percentage of time in which slice1 L3 bank2 is stalled"
+             data_type="float"
+             max_equation="100"
+             equation="B 2 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l31_bank2_stalled"
+             units="percent"
+             symbol_name="L31Bank2Stalled"
+             availability="$SliceMask 2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 L3 Bank0 Stalled"
+             description="The percentage of time in which slice0 L3 bank0 is stalled"
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l30_bank0_stalled"
+             units="percent"
+             symbol_name="L30Bank0Stalled"
+             availability="$SliceMask 1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ A 31 READ UADD A 32 READ UADD 64 UMUL"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00000D04" value="0x00000200" />
+        <register type="NOA" address="0x00009884" value="0x00000000" />
+        <register type="NOA" address="0x00009888" value="0x1661001A" />
+        <register type="NOA" address="0x00009888" value="0x1665001A" />
+        <register type="NOA" address="0x00009888" value="0x1669001A" />
+        <register type="NOA" address="0x00009888" value="0x106C1C00" />
+        <register type="NOA" address="0x00009888" value="0x126C0004" />
+        <register type="NOA" address="0x00009888" value="0x166C001D" />
+        <register type="NOA" address="0x00009888" value="0x10EC0400" />
+        <register type="NOA" address="0x00009888" value="0x16EC0000" />
+        <register type="NOA" address="0x00009888" value="0x02610024" />
+        <register type="NOA" address="0x00009888" value="0x10610000" />
+        <register type="NOA" address="0x00009888" value="0x1E610000" />
+        <register type="NOA" address="0x00009888" value="0x02652400" />
+        <register type="NOA" address="0x00009888" value="0x10650000" />
+        <register type="NOA" address="0x00009888" value="0x1E650000" />
+        <register type="NOA" address="0x00009888" value="0x04690024" />
+        <register type="NOA" address="0x00009888" value="0x10690000" />
+        <register type="NOA" address="0x00009888" value="0x1E690000" />
+        <register type="NOA" address="0x00009888" value="0x006C0020" />
+        <register type="NOA" address="0x00009888" value="0x066C2800" />
+        <register type="NOA" address="0x00009888" value="0x0A6C2820" />
+        <register type="NOA" address="0x00009888" value="0x0E6C3832" />
+        <register type="NOA" address="0x00009888" value="0x186C05A0" />
+        <register type="NOA" address="0x00009888" value="0x1A6C1010" />
+        <register type="NOA" address="0x00009888" value="0x1C6C0000" />
+        <register type="NOA" address="0x00009888" value="0x186D8000" />
+        <register type="NOA" address="0x00009888" value="0x0A6E1000" />
+        <register type="NOA" address="0x00009888" value="0x0073F000" />
+        <register type="NOA" address="0x00009888" value="0x02738000" />
+        <register type="NOA" address="0x00009888" value="0x0473D000" />
+        <register type="NOA" address="0x00009888" value="0x0673D000" />
+        <register type="NOA" address="0x00009888" value="0x00778000" />
+        <register type="NOA" address="0x00009888" value="0x0E778000" />
+        <register type="NOA" address="0x00009888" value="0x14778000" />
+        <register type="NOA" address="0x00009888" value="0x16778A80" />
+        <register type="NOA" address="0x00009888" value="0x18770002" />
+        <register type="NOA" address="0x00009888" value="0x02778000" />
+        <register type="NOA" address="0x00009888" value="0x04778000" />
+        <register type="NOA" address="0x00009888" value="0x06778000" />
+        <register type="NOA" address="0x00009888" value="0x08774000" />
+        <register type="NOA" address="0x00009888" value="0x04784000" />
+        <register type="NOA" address="0x00009888" value="0x0A7B0004" />
+        <register type="NOA" address="0x00009888" value="0x08EC0020" />
+        <register type="NOA" address="0x00009888" value="0x0CEC0020" />
+        <register type="NOA" address="0x00009888" value="0x00EC3600" />
+        <register type="NOA" address="0x00009888" value="0x1AEC0000" />
+        <register type="NOA" address="0x00009888" value="0x18EC0000" />
+        <register type="NOA" address="0x00009888" value="0x04F31000" />
+        <register type="NOA" address="0x00009888" value="0x06F31000" />
+        <register type="NOA" address="0x00009888" value="0x00F32000" />
+        <register type="NOA" address="0x00009888" value="0x14F78000" />
+        <register type="NOA" address="0x00009888" value="0x16F70800" />
+        <register type="NOA" address="0x00009888" value="0x02F78000" />
+        <register type="NOA" address="0x00009884" value="0x00000007" />
+        <register type="NOA" address="0x00009888" value="0x2100F000" />
+        <register type="NOA" address="0x00009888" value="0x1D000071" />
+        <register type="NOA" address="0x00009888" value="0x33000000" />
+        <register type="NOA" address="0x00009888" value="0x1100C000" />
+        <register type="NOA" address="0x00009888" value="0x1F00C000" />
+        <register type="NOA" address="0x00009888" value="0x2500C000" />
+        <register type="NOA" address="0x00009888" value="0x2700C000" />
+        <register type="NOA" address="0x00009888" value="0x2900C000" />
+        <register type="NOA" address="0x00009888" value="0x2D00C000" />
+        <register type="NOA" address="0x00009888" value="0x2F00C000" />
+        <register type="NOA" address="0x00009888" value="0x1300C000" />
+        <register type="NOA" address="0x00009888" value="0x1500C000" />
+        <register type="NOA" address="0x00009888" value="0x1700C000" />
+        <register type="NOA" address="0x00009888" value="0x1900C000" />
+        <register type="NOA" address="0x00009888" value="0x47000101" />
+        <register type="NOA" address="0x00009888" value="0x39000001" />
+        <register type="NOA" address="0x00009888" value="0x49001300" />
+        <register type="NOA" address="0x00009888" value="0x3D000021" />
+        <register type="NOA" address="0x00009888" value="0x4B001100" />
+        <register type="NOA" address="0x00009888" value="0x3F000420" />
+        <register type="NOA" address="0x00009888" value="0x4D001100" />
+        <register type="NOA" address="0x00009888" value="0x41000400" />
+        <register type="NOA" address="0x00009888" value="0x35000000" />
+        <register type="NOA" address="0x00009888" value="0x31000000" />
+        <register type="NOA" address="0x00009888" value="0x43000001" />
+        <register type="NOA" address="0x00009888" value="0x3B0000C7" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x70800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+        <register type="OA" address="0x00002770" value="0x20000801" />
+        <register type="OA" address="0x00002774" value="0x0111FEEE" />
+        <register type="OA" address="0x00002778" value="0x40001001" />
+        <register type="OA" address="0x0000277C" value="0x0222FDDD" />
+        <register type="OA" address="0x00002780" value="0x80002002" />
+        <register type="OA" address="0x00002784" value="0x0444FBBB" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+    </register_config>
+  </set>
+
+  <set name="Metric set L3_2"
+       mdapi_supported_apis="VK OGL OCL IO BB"
+       underscore_name="l3_2"
+       hw_config_guid="918834e2-a1a4-4d77-9f3a-0c229f8d803f"
+       chipset="CNL"
+       symbol_name="L3_2"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice1 L3 Bank1 Stalled"
+             description="The percentage of time in which slice1 L3 bank1 is stalled"
+             data_type="float"
+             max_equation="100"
+             equation="B 1 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l31_bank1_stalled"
+             units="percent"
+             symbol_name="L31Bank1Stalled"
+             availability="$SliceMask 2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SQ is full"
+             description="The percentage of time when SQ is filled above a threshold (usually 48 entries)"
+             data_type="float"
+             max_equation="100"
+             equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gt_request_queue_full"
+             units="percent"
+             symbol_name="GTRequestQueueFull"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on the both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Slice1 L3 Bank0 Stalled"
+             description="The percentage of time in which slice1 L3 bank0 is stalled"
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l31_bank0_stalled"
+             units="percent"
+             symbol_name="L31Bank0Stalled"
+             availability="$SliceMask 2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 L3 Bank2 Stalled"
+             description="The percentage of time in which slice0 L3 bank2 is stalled"
+             data_type="float"
+             max_equation="100"
+             equation="B 2 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l30_bank2_stalled"
+             units="percent"
+             symbol_name="L30Bank2Stalled"
+             availability="$SliceMask 1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice1 L3 Bank2 Active"
+             description="The percentage of time in which slice1 L3 bank2 is active"
+             data_type="float"
+             max_equation="100"
+             equation="C 5 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l31_bank2_active"
+             units="percent"
+             symbol_name="L31Bank2Active"
+             availability="$SliceMask 2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="Slice1 L3 Bank1 Active"
+             description="The percentage of time in which slice1 L3 bank1 is active"
+             data_type="float"
+             max_equation="100"
+             equation="C 4 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l31_bank1_active"
+             units="percent"
+             symbol_name="L31Bank1Active"
+             availability="$SliceMask 2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice1 L3 Bank0 Active"
+             description="The percentage of time in which slice1 L3 bank0 is active"
+             data_type="float"
+             max_equation="100"
+             equation="C 3 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l31_bank0_active"
+             units="percent"
+             symbol_name="L31Bank0Active"
+             availability="$SliceMask 2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ A 31 READ UADD A 32 READ UADD 64 UMUL"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00000D04" value="0x00000200" />
+        <register type="NOA" address="0x00009884" value="0x00000000" />
+        <register type="NOA" address="0x00009888" value="0x106C0400" />
+        <register type="NOA" address="0x00009888" value="0x166C0000" />
+        <register type="NOA" address="0x00009888" value="0x16E1001A" />
+        <register type="NOA" address="0x00009888" value="0x16E5001A" />
+        <register type="NOA" address="0x00009888" value="0x16E9001A" />
+        <register type="NOA" address="0x00009888" value="0x10EC1C00" />
+        <register type="NOA" address="0x00009888" value="0x12EC0004" />
+        <register type="NOA" address="0x00009888" value="0x16EC001D" />
+        <register type="NOA" address="0x00009888" value="0x086C0020" />
+        <register type="NOA" address="0x00009888" value="0x0C6C0020" />
+        <register type="NOA" address="0x00009888" value="0x006C3600" />
+        <register type="NOA" address="0x00009888" value="0x186C0A88" />
+        <register type="NOA" address="0x00009888" value="0x1A6C0504" />
+        <register type="NOA" address="0x00009888" value="0x1C6C0005" />
+        <register type="NOA" address="0x00009888" value="0x0073F000" />
+        <register type="NOA" address="0x00009888" value="0x02739000" />
+        <register type="NOA" address="0x00009888" value="0x0473D000" />
+        <register type="NOA" address="0x00009888" value="0x0673D000" />
+        <register type="NOA" address="0x00009888" value="0x00778000" />
+        <register type="NOA" address="0x00009888" value="0x0E778000" />
+        <register type="NOA" address="0x00009888" value="0x14778000" />
+        <register type="NOA" address="0x00009888" value="0x16778A80" />
+        <register type="NOA" address="0x00009888" value="0x18770002" />
+        <register type="NOA" address="0x00009888" value="0x02778000" />
+        <register type="NOA" address="0x00009888" value="0x04778000" />
+        <register type="NOA" address="0x00009888" value="0x06778000" />
+        <register type="NOA" address="0x00009888" value="0x08778000" />
+        <register type="NOA" address="0x00009888" value="0x02E10024" />
+        <register type="NOA" address="0x00009888" value="0x10E10000" />
+        <register type="NOA" address="0x00009888" value="0x1EE10000" />
+        <register type="NOA" address="0x00009888" value="0x02E52400" />
+        <register type="NOA" address="0x00009888" value="0x10E50000" />
+        <register type="NOA" address="0x00009888" value="0x1EE50000" />
+        <register type="NOA" address="0x00009888" value="0x04E90024" />
+        <register type="NOA" address="0x00009888" value="0x10E90000" />
+        <register type="NOA" address="0x00009888" value="0x1EE90000" />
+        <register type="NOA" address="0x00009888" value="0x00EC0020" />
+        <register type="NOA" address="0x00009888" value="0x06EC2800" />
+        <register type="NOA" address="0x00009888" value="0x0AEC2820" />
+        <register type="NOA" address="0x00009888" value="0x0EEC3832" />
+        <register type="NOA" address="0x00009888" value="0x18EC0580" />
+        <register type="NOA" address="0x00009888" value="0x1AEC0000" />
+        <register type="NOA" address="0x00009888" value="0x1CEC0000" />
+        <register type="NOA" address="0x00009888" value="0x18ED8000" />
+        <register type="NOA" address="0x00009888" value="0x0AEE1000" />
+        <register type="NOA" address="0x00009888" value="0x00F3D000" />
+        <register type="NOA" address="0x00009888" value="0x02F38000" />
+        <register type="NOA" address="0x00009888" value="0x04F3C000" />
+        <register type="NOA" address="0x00009888" value="0x06F3C000" />
+        <register type="NOA" address="0x00009888" value="0x00F78000" />
+        <register type="NOA" address="0x00009888" value="0x0EF78000" />
+        <register type="NOA" address="0x00009888" value="0x16F78280" />
+        <register type="NOA" address="0x00009888" value="0x18F70002" />
+        <register type="NOA" address="0x00009888" value="0x04F78000" />
+        <register type="NOA" address="0x00009888" value="0x06F78000" />
+        <register type="NOA" address="0x00009888" value="0x08F74000" />
+        <register type="NOA" address="0x00009888" value="0x04F84000" />
+        <register type="NOA" address="0x00009888" value="0x0AFB0004" />
+        <register type="NOA" address="0x00009884" value="0x00000007" />
+        <register type="NOA" address="0x00009888" value="0x2100F000" />
+        <register type="NOA" address="0x00009888" value="0x1D000071" />
+        <register type="NOA" address="0x00009888" value="0x33000000" />
+        <register type="NOA" address="0x00009888" value="0x1100C000" />
+        <register type="NOA" address="0x00009888" value="0x1F00C000" />
+        <register type="NOA" address="0x00009888" value="0x2500C000" />
+        <register type="NOA" address="0x00009888" value="0x2700C000" />
+        <register type="NOA" address="0x00009888" value="0x2900C000" />
+        <register type="NOA" address="0x00009888" value="0x2D00C000" />
+        <register type="NOA" address="0x00009888" value="0x2F00C000" />
+        <register type="NOA" address="0x00009888" value="0x1300C000" />
+        <register type="NOA" address="0x00009888" value="0x1500C000" />
+        <register type="NOA" address="0x00009888" value="0x1700C000" />
+        <register type="NOA" address="0x00009888" value="0x1900C000" />
+        <register type="NOA" address="0x00009888" value="0x47000010" />
+        <register type="NOA" address="0x00009888" value="0x39000883" />
+        <register type="NOA" address="0x00009888" value="0x49000300" />
+        <register type="NOA" address="0x00009888" value="0x3D001064" />
+        <register type="NOA" address="0x00009888" value="0x4B000001" />
+        <register type="NOA" address="0x00009888" value="0x3F000C60" />
+        <register type="NOA" address="0x00009888" value="0x4D000001" />
+        <register type="NOA" address="0x00009888" value="0x41000C04" />
+        <register type="NOA" address="0x00009888" value="0x35000000" />
+        <register type="NOA" address="0x00009888" value="0x31000000" />
+        <register type="NOA" address="0x00009888" value="0x43000003" />
+        <register type="NOA" address="0x00009888" value="0x3B000001" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x70800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+        <register type="OA" address="0x00002770" value="0x20000801" />
+        <register type="OA" address="0x00002774" value="0x0111FEEE" />
+        <register type="OA" address="0x00002778" value="0x40001001" />
+        <register type="OA" address="0x0000277C" value="0x0222FDDD" />
+        <register type="OA" address="0x00002780" value="0x80002002" />
+        <register type="OA" address="0x00002784" value="0x0444FBBB" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+    </register_config>
+  </set>
+
+  <set name="Metric set RasterizerAndPixelBackend"
+       mdapi_supported_apis="VK OGL OCL IO BB"
+       underscore_name="rasterizer_and_pixel_backend"
+       hw_config_guid="2e95713a-c6d8-47a9-9207-eba3e208be51"
+       chipset="CNL"
+       symbol_name="RasterizerAndPixelBackend"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice1 Rasterizer Input Available"
+             description="The percentage of time in which slice1 rasterizer input is available"
+             data_type="float"
+             max_equation="100"
+             equation="B 1 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="rasterizer1_input_available"
+             units="percent"
+             symbol_name="Rasterizer1InputAvailable"
+             availability="$SliceMask 2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Rasterizer"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Slice0 Pixel Values Ready"
+             description="The percentage of time in which slice0 pixel values are ready"
+             data_type="float"
+             max_equation="100"
+             equation="C 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="pixel_values0_ready"
+             units="percent"
+             symbol_name="PixelValues0Ready"
+             availability="$SliceMask 1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/3D Pipe"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texel lookups (with 2x2 accuracy) that missed the L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="Slice0 Rasterizer Input Available"
+             description="The percentage of time in which slice0 rasterizer input is available"
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="rasterizer0_input_available"
+             units="percent"
+             symbol_name="Rasterizer0InputAvailable"
+             availability="$SliceMask 1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Rasterizer"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Slice0 Post-EarlyZ Pixel Data Ready"
+             description="The percentage of time in which slice0 post-EarlyZ pixel data is ready (after early Z tests have been applied)"
+             data_type="float"
+             max_equation="100"
+             equation="B 4 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="pixel_data0_ready"
+             units="percent"
+             symbol_name="PixelData0Ready"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Rasterizer/Early Depth Test"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice1 Pixel Values Ready"
+             description="The percentage of time in which slice1 pixel values are ready"
+             data_type="float"
+             max_equation="100"
+             equation="C 1 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="pixel_values1_ready"
+             units="percent"
+             symbol_name="PixelValues1Ready"
+             availability="$SliceMask 2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/3D Pipe"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Slice1 PS Output Available"
+             description="The percentage of time in which slice1 PS output is available"
+             data_type="float"
+             max_equation="100"
+             equation="B 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_output1_available"
+             units="percent"
+             symbol_name="PSOutput1Available"
+             availability="$SliceMask 2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/3D Pipe"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 Rasterizer Output Ready"
+             description="The percentage of time in which slice0 rasterizer output is ready"
+             data_type="float"
+             max_equation="100"
+             equation="B 2 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="rasterizer0_output_ready"
+             units="percent"
+             symbol_name="Rasterizer0OutputReady"
+             availability="$SliceMask 1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Rasterizer"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Slice1 Rasterizer Output Ready"
+             description="The percentage of time in which slice1 rasterizer output is ready"
+             data_type="float"
+             max_equation="100"
+             equation="B 3 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="rasterizer1_output_ready"
+             units="percent"
+             symbol_name="Rasterizer1OutputReady"
+             availability="$SliceMask 2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Rasterizer"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Slice1 Post-EarlyZ Pixel Data Ready"
+             description="The percentage of time in which slice1 post-EarlyZ pixel data is ready (after early Z tests have been applied)"
+             data_type="float"
+             max_equation="100"
+             equation="B 5 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="pixel_data1_ready"
+             units="percent"
+             symbol_name="PixelData1Ready"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Rasterizer/Early Depth Test"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="SQ is full"
+             description="The percentage of time when SQ is filled above a threshold (usually 48 entries)"
+             data_type="float"
+             max_equation="100"
+             equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gt_request_queue_full"
+             units="percent"
+             symbol_name="GTRequestQueueFull"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ A 31 READ UADD A 32 READ UADD 64 UMUL"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 PS Output Available"
+             description="The percentage of time in which slice0 PS output is available"
+             data_type="float"
+             max_equation="100"
+             equation="B 6 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_output0_available"
+             units="percent"
+             symbol_name="PSOutput0Available"
+             availability="$SliceMask 1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/3D Pipe"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00000D04" value="0x00000200" />
+        <register type="NOA" address="0x00009884" value="0x00000000" />
+        <register type="NOA" address="0x00009888" value="0x0C710004" />
+        <register type="NOA" address="0x00009888" value="0x10747000" />
+        <register type="NOA" address="0x00009888" value="0x12756800" />
+        <register type="NOA" address="0x00009888" value="0x04795000" />
+        <register type="NOA" address="0x00009888" value="0x127C01C0" />
+        <register type="NOA" address="0x00009888" value="0x0CF10004" />
+        <register type="NOA" address="0x00009888" value="0x10F47000" />
+        <register type="NOA" address="0x00009888" value="0x12F56800" />
+        <register type="NOA" address="0x00009888" value="0x04F95000" />
+        <register type="NOA" address="0x00009888" value="0x12FC01C0" />
+        <register type="NOA" address="0x00009888" value="0x1A6C4044" />
+        <register type="NOA" address="0x00009888" value="0x1C6C0004" />
+        <register type="NOA" address="0x00009888" value="0x186C00A0" />
+        <register type="NOA" address="0x00009888" value="0x00710010" />
+        <register type="NOA" address="0x00009888" value="0x02738000" />
+        <register type="NOA" address="0x00009888" value="0x04732000" />
+        <register type="NOA" address="0x00009888" value="0x0673A000" />
+        <register type="NOA" address="0x00009888" value="0x00736000" />
+        <register type="NOA" address="0x00009888" value="0x08740037" />
+        <register type="NOA" address="0x00009888" value="0x0C740000" />
+        <register type="NOA" address="0x00009888" value="0x0A750F36" />
+        <register type="NOA" address="0x00009888" value="0x10750000" />
+        <register type="NOA" address="0x00009888" value="0x04751000" />
+        <register type="NOA" address="0x00009888" value="0x0C752000" />
+        <register type="NOA" address="0x00009888" value="0x0E750000" />
+        <register type="NOA" address="0x00009888" value="0x0C760800" />
+        <register type="NOA" address="0x00009888" value="0x0E768800" />
+        <register type="NOA" address="0x00009888" value="0x10760002" />
+        <register type="NOA" address="0x00009888" value="0x0077C000" />
+        <register type="NOA" address="0x00009888" value="0x0E778000" />
+        <register type="NOA" address="0x00009888" value="0x1477C000" />
+        <register type="NOA" address="0x00009888" value="0x167767E0" />
+        <register type="NOA" address="0x00009888" value="0x18770002" />
+        <register type="NOA" address="0x00009888" value="0x02778000" />
+        <register type="NOA" address="0x00009888" value="0x04778000" />
+        <register type="NOA" address="0x00009888" value="0x0C790017" />
+        <register type="NOA" address="0x00009888" value="0x08790000" />
+        <register type="NOA" address="0x00009888" value="0x0C7B0088" />
+        <register type="NOA" address="0x00009888" value="0x0E7C0032" />
+        <register type="NOA" address="0x00009888" value="0x107C0000" />
+        <register type="NOA" address="0x00009888" value="0x167C0004" />
+        <register type="NOA" address="0x00009888" value="0x04F10200" />
+        <register type="NOA" address="0x00009888" value="0x00F10000" />
+        <register type="NOA" address="0x00009888" value="0x08F40DC0" />
+        <register type="NOA" address="0x00009888" value="0x0CF40000" />
+        <register type="NOA" address="0x00009888" value="0x00F50D80" />
+        <register type="NOA" address="0x00009888" value="0x02F5003C" />
+        <register type="NOA" address="0x00009888" value="0x10F50000" />
+        <register type="NOA" address="0x00009888" value="0x0AF54000" />
+        <register type="NOA" address="0x00009888" value="0x0CF58000" />
+        <register type="NOA" address="0x00009888" value="0x04F50000" />
+        <register type="NOA" address="0x00009888" value="0x06F50000" />
+        <register type="NOA" address="0x00009888" value="0x0EF62200" />
+        <register type="NOA" address="0x00009888" value="0x0CF6A000" />
+        <register type="NOA" address="0x00009888" value="0x0EF7C000" />
+        <register type="NOA" address="0x00009888" value="0x16F71030" />
+        <register type="NOA" address="0x00009888" value="0x18F70001" />
+        <register type="NOA" address="0x00009888" value="0x02F7C000" />
+        <register type="NOA" address="0x00009888" value="0x04F7C000" />
+        <register type="NOA" address="0x00009888" value="0x0CF905C0" />
+        <register type="NOA" address="0x00009888" value="0x08F90000" />
+        <register type="NOA" address="0x00009888" value="0x0CFB0220" />
+        <register type="NOA" address="0x00009888" value="0x0EFC1900" />
+        <register type="NOA" address="0x00009888" value="0x10FC0000" />
+        <register type="NOA" address="0x00009888" value="0x16FC0010" />
+        <register type="NOA" address="0x00009884" value="0x00000007" />
+        <register type="NOA" address="0x00009888" value="0x2100F000" />
+        <register type="NOA" address="0x00009888" value="0x1D000071" />
+        <register type="NOA" address="0x00009888" value="0x33000000" />
+        <register type="NOA" address="0x00009888" value="0x1100C000" />
+        <register type="NOA" address="0x00009888" value="0x1F00C000" />
+        <register type="NOA" address="0x00009888" value="0x2300C000" />
+        <register type="NOA" address="0x00009888" value="0x2500C000" />
+        <register type="NOA" address="0x00009888" value="0x2700C000" />
+        <register type="NOA" address="0x00009888" value="0x2900C000" />
+        <register type="NOA" address="0x00009888" value="0x2B00C000" />
+        <register type="NOA" address="0x00009888" value="0x2D00C000" />
+        <register type="NOA" address="0x00009888" value="0x2F00C000" />
+        <register type="NOA" address="0x00009888" value="0x1300C000" />
+        <register type="NOA" address="0x00009888" value="0x1500C000" />
+        <register type="NOA" address="0x00009888" value="0x47000001" />
+        <register type="NOA" address="0x00009888" value="0x39000421" />
+        <register type="NOA" address="0x00009888" value="0x49000300" />
+        <register type="NOA" address="0x00009888" value="0x3D000402" />
+        <register type="NOA" address="0x00009888" value="0x4B001101" />
+        <register type="NOA" address="0x00009888" value="0x3F000840" />
+        <register type="NOA" address="0x00009888" value="0x4D000101" />
+        <register type="NOA" address="0x00009888" value="0x41000801" />
+        <register type="NOA" address="0x00009888" value="0x35000000" />
+        <register type="NOA" address="0x00009888" value="0x31000000" />
+        <register type="NOA" address="0x00009888" value="0x43000001" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x30800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x30800000" />
+        <register type="OA" address="0x00002770" value="0x00000180" />
+        <register type="OA" address="0x00002774" value="0x0000FFCF" />
+        <register type="OA" address="0x00002778" value="0x00006000" />
+        <register type="OA" address="0x0000277C" value="0x0000F3FF" />
+        <register type="OA" address="0x00002790" value="0x00000002" />
+        <register type="OA" address="0x00002794" value="0x0000FFFE" />
+        <register type="OA" address="0x00002798" value="0x00000002" />
+        <register type="OA" address="0x0000279C" value="0x0000FFFD" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+    </register_config>
+  </set>
+
+  <set name="Metric set Sampler"
+       mdapi_supported_apis="VK OGL OCL IO BB"
+       underscore_name="sampler"
+       hw_config_guid="9bcf4ff2-c15f-4bea-8ec8-8db87791942e"
+       chipset="CNL"
+       symbol_name="Sampler"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 Subslice2 Input Available"
+             description="The percentage of time in which slice0 subslice2 sampler input is available"
+             data_type="float"
+             max_equation="100"
+             equation="B 2 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler02_input_available"
+             units="percent"
+             symbol_name="Sampler02InputAvailable"
+             availability="$SubsliceMask 4 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SQ is full"
+             description="The percentage of time when SQ is filled above a threshold (usually 48 entries)"
+             data_type="float"
+             max_equation="100"
+             equation="C 2 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gt_request_queue_full"
+             units="percent"
+             symbol_name="GTRequestQueueFull"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 Subslice0 Input Available"
+             description="The percentage of time in which slice0 subslice0 sampler input is available"
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler00_input_available"
+             units="percent"
+             symbol_name="Sampler00InputAvailable"
+             availability="$SubsliceMask 1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Slice1 Subslice0 Input Available"
+             description="The percentage of time in which slice1 subslice0 sampler input is available"
+             data_type="float"
+             max_equation="100"
+             equation="B 3 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler10_input_available"
+             units="percent"
+             symbol_name="Sampler10InputAvailable"
+             availability="$SubsliceMask 8 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were actively processed on both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="Slice0 Subslice2 Sampler Output Ready"
+             description="The percentage of time in which slice0 subslice2 sampler output is ready"
+             data_type="float"
+             max_equation="100"
+             equation="C 5 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler02_output_ready"
+             units="percent"
+             symbol_name="Sampler02OutputReady"
+             availability="$SubsliceMask 4 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Slice0 Subslice1 Input Available"
+             description="The percentage of time in which slice0 subslice1 sampler input is available"
+             data_type="float"
+             max_equation="100"
+             equation="B 1 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler01_input_available"
+             units="percent"
+             symbol_name="Sampler01InputAvailable"
+             availability="$SubsliceMask 2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texel lookups (with 2x2 accuracy) that missed the L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice1 Subslice1 Input Available"
+             description="The percentage of time in which slice1 subslice1 sampler input is available"
+             data_type="float"
+             max_equation="100"
+             equation="B 4 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler11_input_available"
+             units="percent"
+             symbol_name="Sampler11InputAvailable"
+             availability="$SubsliceMask 16 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Slice0 Subslice0 Sampler Output Ready"
+             description="The percentage of time in which slice0 subslice0 sampler output is ready"
+             data_type="float"
+             max_equation="100"
+             equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler00_output_ready"
+             units="percent"
+             symbol_name="Sampler00OutputReady"
+             availability="$SubsliceMask 1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Slice1 Subslice0 Sampler Output Ready"
+             description="The percentage of time in which slice1 subslice0 sampler output is ready"
+             data_type="float"
+             max_equation="100"
+             equation="C 4 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler10_output_ready"
+             units="percent"
+             symbol_name="Sampler10OutputReady"
+             availability="$SubsliceMask 8 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Slice0 Subslice1 Sampler Output Ready"
+             description="The percentage of time in which slice0 subslice1 sampler output is ready"
+             data_type="float"
+             max_equation="100"
+             equation="C 6 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler01_output_ready"
+             units="percent"
+             symbol_name="Sampler01OutputReady"
+             availability="$SubsliceMask 2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="Slice1 Subslice1 Sampler Output Ready"
+             description="The percentage of time in which slice1 subslice1 sampler output is ready"
+             data_type="float"
+             max_equation="100"
+             equation="C 3 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler11_output_ready"
+             units="percent"
+             symbol_name="Sampler11OutputReady"
+             availability="$SubsliceMask 16 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches without URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ A 31 READ UADD A 32 READ UADD 64 UMUL"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00000D04" value="0x00000200" />
+        <register type="NOA" address="0x00009884" value="0x00000000" />
+        <register type="NOA" address="0x00009888" value="0x14141400" />
+        <register type="NOA" address="0x00009888" value="0x1614000B" />
+        <register type="NOA" address="0x00009888" value="0x14161400" />
+        <register type="NOA" address="0x00009888" value="0x14341400" />
+        <register type="NOA" address="0x00009888" value="0x1634000B" />
+        <register type="NOA" address="0x00009888" value="0x14361400" />
+        <register type="NOA" address="0x00009888" value="0x14941400" />
+        <register type="NOA" address="0x00009888" value="0x1694000B" />
+        <register type="NOA" address="0x00009888" value="0x14961400" />
+        <register type="NOA" address="0x00009888" value="0x14B41400" />
+        <register type="NOA" address="0x00009888" value="0x16B4000B" />
+        <register type="NOA" address="0x00009888" value="0x14B61400" />
+        <register type="NOA" address="0x00009888" value="0x14541400" />
+        <register type="NOA" address="0x00009888" value="0x1654000B" />
+        <register type="NOA" address="0x00009888" value="0x14561400" />
+        <register type="NOA" address="0x00009888" value="0x1A6C5000" />
+        <register type="NOA" address="0x00009888" value="0x1C6C0005" />
+        <register type="NOA" address="0x00009888" value="0x186C0280" />
+        <register type="NOA" address="0x00009888" value="0x0673F000" />
+        <register type="NOA" address="0x00009888" value="0x0073C000" />
+        <register type="NOA" address="0x00009888" value="0x04742000" />
+        <register type="NOA" address="0x00009888" value="0x0A74A000" />
+        <register type="NOA" address="0x00009888" value="0x04752000" />
+        <register type="NOA" address="0x00009888" value="0x0A75A000" />
+        <register type="NOA" address="0x00009888" value="0x0C760800" />
+        <register type="NOA" address="0x00009888" value="0x0E760280" />
+        <register type="NOA" address="0x00009888" value="0x0077C000" />
+        <register type="NOA" address="0x00009888" value="0x0E77C000" />
+        <register type="NOA" address="0x00009888" value="0x14774000" />
+        <register type="NOA" address="0x00009888" value="0x1677A950" />
+        <register type="NOA" address="0x00009888" value="0x18770002" />
+        <register type="NOA" address="0x00009888" value="0x04778000" />
+        <register type="NOA" address="0x00009888" value="0x06778000" />
+        <register type="NOA" address="0x00009888" value="0x08774000" />
+        <register type="NOA" address="0x00009888" value="0x0A774000" />
+        <register type="NOA" address="0x00009888" value="0x0C77C000" />
+        <register type="NOA" address="0x00009888" value="0x0A7BA828" />
+        <register type="NOA" address="0x00009888" value="0x0C7B0002" />
+        <register type="NOA" address="0x00009888" value="0x147CE800" />
+        <register type="NOA" address="0x00009888" value="0x167C0003" />
+        <register type="NOA" address="0x00009888" value="0x087CC000" />
+        <register type="NOA" address="0x00009888" value="0x0A7C8000" />
+        <register type="NOA" address="0x00009888" value="0x1C7D8200" />
+        <register type="NOA" address="0x00009888" value="0x1E7D0002" />
+        <register type="NOA" address="0x00009888" value="0x00194000" />
+        <register type="NOA" address="0x00009888" value="0x0E194000" />
+        <register type="NOA" address="0x00009888" value="0x0C194000" />
+        <register type="NOA" address="0x00009888" value="0x00140050" />
+        <register type="NOA" address="0x00009888" value="0x06145800" />
+        <register type="NOA" address="0x00009888" value="0x10140000" />
+        <register type="NOA" address="0x00009888" value="0x18140000" />
+        <register type="NOA" address="0x00009888" value="0x1C140080" />
+        <register type="NOA" address="0x00009888" value="0x0A150001" />
+        <register type="NOA" address="0x00009888" value="0x06160043" />
+        <register type="NOA" address="0x00009888" value="0x10160000" />
+        <register type="NOA" address="0x00009888" value="0x0C160000" />
+        <register type="NOA" address="0x00009888" value="0x1A3900A0" />
+        <register type="NOA" address="0x00009888" value="0x0A394000" />
+        <register type="NOA" address="0x00009888" value="0x08345850" />
+        <register type="NOA" address="0x00009888" value="0x10340000" />
+        <register type="NOA" address="0x00009888" value="0x1C340020" />
+        <register type="NOA" address="0x00009888" value="0x08358000" />
+        <register type="NOA" address="0x00009888" value="0x04362180" />
+        <register type="NOA" address="0x00009888" value="0x10360000" />
+        <register type="NOA" address="0x00009888" value="0x0A360000" />
+        <register type="NOA" address="0x00009888" value="0x12F40140" />
+        <register type="NOA" address="0x00009888" value="0x06F48000" />
+        <register type="NOA" address="0x00009888" value="0x14F5000A" />
+        <register type="NOA" address="0x00009888" value="0x06F58000" />
+        <register type="NOA" address="0x00009888" value="0x10F60028" />
+        <register type="NOA" address="0x00009888" value="0x0EF60002" />
+        <register type="NOA" address="0x00009888" value="0x16F77C00" />
+        <register type="NOA" address="0x00009888" value="0x18F70001" />
+        <register type="NOA" address="0x00009888" value="0x04F74000" />
+        <register type="NOA" address="0x00009888" value="0x06F7C000" />
+        <register type="NOA" address="0x00009888" value="0x0CFB0280" />
+        <register type="NOA" address="0x00009888" value="0x08FB8000" />
+        <register type="NOA" address="0x00009888" value="0x16FC0280" />
+        <register type="NOA" address="0x00009888" value="0x04FC8000" />
+        <register type="NOA" address="0x00009888" value="0x1EFD2800" />
+        <register type="NOA" address="0x00009888" value="0x1CFD0008" />
+        <register type="NOA" address="0x00009888" value="0x1A992000" />
+        <register type="NOA" address="0x00009888" value="0x1C990001" />
+        <register type="NOA" address="0x00009888" value="0x06994000" />
+        <register type="NOA" address="0x00009888" value="0x0C945850" />
+        <register type="NOA" address="0x00009888" value="0x10940000" />
+        <register type="NOA" address="0x00009888" value="0x1E940000" />
+        <register type="NOA" address="0x00009888" value="0x1C940002" />
+        <register type="NOA" address="0x00009888" value="0x08952000" />
+        <register type="NOA" address="0x00009888" value="0x02962180" />
+        <register type="NOA" address="0x00009888" value="0x10960000" />
+        <register type="NOA" address="0x00009888" value="0x06960000" />
+        <register type="NOA" address="0x00009888" value="0x1CB90014" />
+        <register type="NOA" address="0x00009888" value="0x04B94000" />
+        <register type="NOA" address="0x00009888" value="0x0EB45850" />
+        <register type="NOA" address="0x00009888" value="0x10B40000" />
+        <register type="NOA" address="0x00009888" value="0x1EB40000" />
+        <register type="NOA" address="0x00009888" value="0x1AB48000" />
+        <register type="NOA" address="0x00009888" value="0x08B51000" />
+        <register type="NOA" address="0x00009888" value="0x02B60043" />
+        <register type="NOA" address="0x00009888" value="0x10B60000" />
+        <register type="NOA" address="0x00009888" value="0x04B60000" />
+        <register type="NOA" address="0x00009888" value="0x1A590A00" />
+        <register type="NOA" address="0x00009888" value="0x08594000" />
+        <register type="NOA" address="0x00009888" value="0x0A545850" />
+        <register type="NOA" address="0x00009888" value="0x10540000" />
+        <register type="NOA" address="0x00009888" value="0x1C540008" />
+        <register type="NOA" address="0x00009888" value="0x1E540000" />
+        <register type="NOA" address="0x00009888" value="0x08554000" />
+        <register type="NOA" address="0x00009888" value="0x04560043" />
+        <register type="NOA" address="0x00009888" value="0x10560000" />
+        <register type="NOA" address="0x00009888" value="0x08560000" />
+        <register type="NOA" address="0x00009884" value="0x00000007" />
+        <register type="NOA" address="0x00009888" value="0x2100F000" />
+        <register type="NOA" address="0x00009888" value="0x13000071" />
+        <register type="NOA" address="0x00009888" value="0x33000000" />
+        <register type="NOA" address="0x00009888" value="0x1100C000" />
+        <register type="NOA" address="0x00009888" value="0x1F00C000" />
+        <register type="NOA" address="0x00009888" value="0x2300C000" />
+        <register type="NOA" address="0x00009888" value="0x2500C000" />
+        <register type="NOA" address="0x00009888" value="0x2700C000" />
+        <register type="NOA" address="0x00009888" value="0x2900C000" />
+        <register type="NOA" address="0x00009888" value="0x2B00C000" />
+        <register type="NOA" address="0x00009888" value="0x2D00C000" />
+        <register type="NOA" address="0x00009888" value="0x2F00C000" />
+        <register type="NOA" address="0x00009888" value="0x1500C000" />
+        <register type="NOA" address="0x00009888" value="0x1700C000" />
+        <register type="NOA" address="0x00009888" value="0x1900C000" />
+        <register type="NOA" address="0x00009888" value="0x1B00C000" />
+        <register type="NOA" address="0x00009888" value="0x1D00C000" />
+        <register type="NOA" address="0x00009888" value="0x47000031" />
+        <register type="NOA" address="0x00009888" value="0x39000143" />
+        <register type="NOA" address="0x00009888" value="0x49001110" />
+        <register type="NOA" address="0x00009888" value="0x3D000C61" />
+        <register type="NOA" address="0x00009888" value="0x4B000011" />
+        <register type="NOA" address="0x00009888" value="0x3F0018C3" />
+        <register type="NOA" address="0x00009888" value="0x4D000000" />
+        <register type="NOA" address="0x00009888" value="0x41000842" />
+        <register type="NOA" address="0x00009888" value="0x35000000" />
+        <register type="NOA" address="0x00009888" value="0x31000000" />
+        <register type="NOA" address="0x00009888" value="0x43000002" />
+        <register type="NOA" address="0x00009888" value="0x3B000480" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x10800000" />
+        <register type="OA" address="0x00002770" value="0x00000018" />
+        <register type="OA" address="0x00002774" value="0x0000FFFC" />
+        <register type="OA" address="0x00002778" value="0x00000060" />
+        <register type="OA" address="0x0000277C" value="0x0000FFF3" />
+        <register type="OA" address="0x00002780" value="0x00000180" />
+        <register type="OA" address="0x00002784" value="0x0000FFCF" />
+        <register type="OA" address="0x00002788" value="0x00000600" />
+        <register type="OA" address="0x0000278C" value="0x0000FF3F" />
+        <register type="OA" address="0x00002790" value="0x00001800" />
+        <register type="OA" address="0x00002794" value="0x0000FCFF" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+    </register_config>
+  </set>
+
+  <set name="Metric set TDL_1"
+       mdapi_supported_apis="VK OGL OCL IO BB"
+       underscore_name="tdl_1"
+       hw_config_guid="c46c7bb5-f26d-4634-b491-902394af85b1"
+       chipset="CNL"
+       symbol_name="TDL_1"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SQ is full"
+             description="The percentage of time when SQ is filled above a threshold (usually 48 entries)"
+             data_type="float"
+             max_equation="100"
+             equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gt_request_queue_full"
+             units="percent"
+             symbol_name="GTRequestQueueFull"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on the both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="PS Thread Ready For Dispatch on Slice1 Subslice1"
+             description="The percentage of time in which PS thread is ready for dispatch on slice1 subslice1 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="B 4 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_thread11_ready_for_dispatch"
+             units="percent"
+             symbol_name="PSThread11ReadyForDispatch"
+             availability="$SubsliceMask 16 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="NonPS Thread Ready For Dispatch on Slice0 Subslice2"
+             description="The percentage of time in which non-PS thread is ready for dispatch on slice0 subslice2 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="1  C 4 READ $GpuCoreClocks FDIV FSUB"
+             underscore_name="non_ps_thread02_ready_for_dispatch"
+             units="percent"
+             symbol_name="NonPSThread02ReadyForDispatch"
+             availability="$SubsliceMask 4 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="NonPS Thread Ready For Dispatch on Slice1 Subslice0"
+             description="The percentage of time in which non-PS thread is ready for dispatch on slice1 subslice0 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="1  C 5 READ $GpuCoreClocks FDIV FSUB"
+             underscore_name="non_ps_thread10_ready_for_dispatch"
+             units="percent"
+             symbol_name="NonPSThread10ReadyForDispatch"
+             availability="$SubsliceMask 8 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="NonPS Thread Ready For Dispatch on Slice0 Subslice0"
+             description="The percentage of time in which non-PS thread is ready for dispatch on slice0 subslice0 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="1  C 2 READ $GpuCoreClocks FDIV FSUB"
+             underscore_name="non_ps_thread00_ready_for_dispatch"
+             units="percent"
+             symbol_name="NonPSThread00ReadyForDispatch"
+             availability="$SubsliceMask 1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Thread Ready For Dispatch on Slice0 Subslice0"
+             description="The percentage of time in which PS thread is ready for dispatch on slice0 subslice0 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_thread00_ready_for_dispatch"
+             units="percent"
+             symbol_name="PSThread00ReadyForDispatch"
+             availability="$SubsliceMask 1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="PS Thread Ready For Dispatch on Slice0 Subslice1"
+             description="The percentage of time in which PS thread is ready for dispatch on slice0 subslice1 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="B 1 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_thread01_ready_for_dispatch"
+             units="percent"
+             symbol_name="PSThread01ReadyForDispatch"
+             availability="$SubsliceMask 2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="PS Thread Ready For Dispatch on Slice1 Subslice0"
+             description="The percentage of time in which PS thread is ready for dispatch on slice1 subslice0 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="B 3 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_thread10_ready_for_dispatch"
+             units="percent"
+             symbol_name="PSThread10ReadyForDispatch"
+             availability="$SubsliceMask 8 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="NonPS Thread Ready For Dispatch on Slice1 Subslice1"
+             description="The percentage of time in which non-PS thread is ready for dispatch on slice1 subslice1 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="1  C 6 READ $GpuCoreClocks FDIV FSUB"
+             underscore_name="non_ps_thread11_ready_for_dispatch"
+             units="percent"
+             symbol_name="NonPSThread11ReadyForDispatch"
+             availability="$SubsliceMask 16 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="PS Thread Ready For Dispatch on Slice0 Subslice2"
+             description="The percentage of time in which PS thread is ready for dispatch on slice0 subslice2 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="B 2 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_thread02_ready_for_dispatch"
+             units="percent"
+             symbol_name="PSThread02ReadyForDispatch"
+             availability="$SubsliceMask 4 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ A 31 READ UADD A 32 READ UADD 64 UMUL"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <counter name="NonPS Thread Ready For Dispatch on Slice0 Subslice1"
+             description="The percentage of time in which non-PS thread is ready for dispatch on slice0 subslice1 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="1  C 3 READ $GpuCoreClocks FDIV FSUB"
+             underscore_name="non_ps_thread01_ready_for_dispatch"
+             units="percent"
+             symbol_name="NonPSThread01ReadyForDispatch"
+             availability="$SubsliceMask 2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00000D04" value="0x00000200" />
+        <register type="NOA" address="0x00009884" value="0x00000000" />
+        <register type="NOA" address="0x00009888" value="0x12180000" />
+        <register type="NOA" address="0x00009888" value="0x12380000" />
+        <register type="NOA" address="0x00009888" value="0x12980000" />
+        <register type="NOA" address="0x00009888" value="0x12B80000" />
+        <register type="NOA" address="0x00009888" value="0x12580000" />
+        <register type="NOA" address="0x00009888" value="0x1A6C5000" />
+        <register type="NOA" address="0x00009888" value="0x1C6C0005" />
+        <register type="NOA" address="0x00009888" value="0x186C2800" />
+        <register type="NOA" address="0x00009888" value="0x0673F000" />
+        <register type="NOA" address="0x00009888" value="0x02733000" />
+        <register type="NOA" address="0x00009888" value="0x0474A000" />
+        <register type="NOA" address="0x00009888" value="0x0A748000" />
+        <register type="NOA" address="0x00009888" value="0x0475A000" />
+        <register type="NOA" address="0x00009888" value="0x0A758000" />
+        <register type="NOA" address="0x00009888" value="0x0C762800" />
+        <register type="NOA" address="0x00009888" value="0x0E760200" />
+        <register type="NOA" address="0x00009888" value="0x0077C000" />
+        <register type="NOA" address="0x00009888" value="0x0E77C000" />
+        <register type="NOA" address="0x00009888" value="0x14774000" />
+        <register type="NOA" address="0x00009888" value="0x1677A950" />
+        <register type="NOA" address="0x00009888" value="0x18770002" />
+        <register type="NOA" address="0x00009888" value="0x0277C000" />
+        <register type="NOA" address="0x00009888" value="0x04774000" />
+        <register type="NOA" address="0x00009888" value="0x06774000" />
+        <register type="NOA" address="0x00009888" value="0x08778000" />
+        <register type="NOA" address="0x00009888" value="0x0A778000" />
+        <register type="NOA" address="0x00009888" value="0x0A7BA802" />
+        <register type="NOA" address="0x00009888" value="0x0C7B0002" />
+        <register type="NOA" address="0x00009888" value="0x087B8000" />
+        <register type="NOA" address="0x00009888" value="0x147CE800" />
+        <register type="NOA" address="0x00009888" value="0x167C0003" />
+        <register type="NOA" address="0x00009888" value="0x047C8000" />
+        <register type="NOA" address="0x00009888" value="0x067CC000" />
+        <register type="NOA" address="0x00009888" value="0x1C7D8008" />
+        <register type="NOA" address="0x00009888" value="0x1E7D0002" />
+        <register type="NOA" address="0x00009888" value="0x00194000" />
+        <register type="NOA" address="0x00009888" value="0x0E194000" />
+        <register type="NOA" address="0x00009888" value="0x02194000" />
+        <register type="NOA" address="0x00009888" value="0x18148000" />
+        <register type="NOA" address="0x00009888" value="0x1C140200" />
+        <register type="NOA" address="0x00009888" value="0x1A142000" />
+        <register type="NOA" address="0x00009888" value="0x0015C000" />
+        <register type="NOA" address="0x00009888" value="0x0A150002" />
+        <register type="NOA" address="0x00009888" value="0x00168000" />
+        <register type="NOA" address="0x00009888" value="0x0E168000" />
+        <register type="NOA" address="0x00009888" value="0x02168000" />
+        <register type="NOA" address="0x00009888" value="0x0018A1A3" />
+        <register type="NOA" address="0x00009888" value="0x0618A500" />
+        <register type="NOA" address="0x00009888" value="0x10180000" />
+        <register type="NOA" address="0x00009888" value="0x1A3900A0" />
+        <register type="NOA" address="0x00009888" value="0x04394000" />
+        <register type="NOA" address="0x00009888" value="0x1C342800" />
+        <register type="NOA" address="0x00009888" value="0x1A348000" />
+        <register type="NOA" address="0x00009888" value="0x0A35000C" />
+        <register type="NOA" address="0x00009888" value="0x08351000" />
+        <register type="NOA" address="0x00009888" value="0x1A360140" />
+        <register type="NOA" address="0x00009888" value="0x04368000" />
+        <register type="NOA" address="0x00009888" value="0x0838A5A3" />
+        <register type="NOA" address="0x00009888" value="0x023800A1" />
+        <register type="NOA" address="0x00009888" value="0x10380000" />
+        <register type="NOA" address="0x00009888" value="0x12F40140" />
+        <register type="NOA" address="0x00009888" value="0x08F42000" />
+        <register type="NOA" address="0x00009888" value="0x14F5000A" />
+        <register type="NOA" address="0x00009888" value="0x08F52000" />
+        <register type="NOA" address="0x00009888" value="0x10F60028" />
+        <register type="NOA" address="0x00009888" value="0x0EF60008" />
+        <register type="NOA" address="0x00009888" value="0x16F77C00" />
+        <register type="NOA" address="0x00009888" value="0x18F70001" />
+        <register type="NOA" address="0x00009888" value="0x08F7C000" />
+        <register type="NOA" address="0x00009888" value="0x0AF74000" />
+        <register type="NOA" address="0x00009888" value="0x0CFB0280" />
+        <register type="NOA" address="0x00009888" value="0x0AFB0020" />
+        <register type="NOA" address="0x00009888" value="0x16FC0280" />
+        <register type="NOA" address="0x00009888" value="0x0AFC8000" />
+        <register type="NOA" address="0x00009888" value="0x1EFD2800" />
+        <register type="NOA" address="0x00009888" value="0x1CFD0200" />
+        <register type="NOA" address="0x00009888" value="0x1A992000" />
+        <register type="NOA" address="0x00009888" value="0x1C990001" />
+        <register type="NOA" address="0x00009888" value="0x08994000" />
+        <register type="NOA" address="0x00009888" value="0x1E940028" />
+        <register type="NOA" address="0x00009888" value="0x1C940008" />
+        <register type="NOA" address="0x00009888" value="0x0A9500C0" />
+        <register type="NOA" address="0x00009888" value="0x08954000" />
+        <register type="NOA" address="0x00009888" value="0x1A964000" />
+        <register type="NOA" address="0x00009888" value="0x1C960002" />
+        <register type="NOA" address="0x00009888" value="0x08968000" />
+        <register type="NOA" address="0x00009888" value="0x0C98A5A3" />
+        <register type="NOA" address="0x00009888" value="0x049800A1" />
+        <register type="NOA" address="0x00009888" value="0x10980000" />
+        <register type="NOA" address="0x00009888" value="0x1CB90014" />
+        <register type="NOA" address="0x00009888" value="0x0AB94000" />
+        <register type="NOA" address="0x00009888" value="0x1EB40280" />
+        <register type="NOA" address="0x00009888" value="0x1CB40020" />
+        <register type="NOA" address="0x00009888" value="0x0AB50300" />
+        <register type="NOA" address="0x00009888" value="0x08B58000" />
+        <register type="NOA" address="0x00009888" value="0x1CB60028" />
+        <register type="NOA" address="0x00009888" value="0x0AB68000" />
+        <register type="NOA" address="0x00009888" value="0x0EB8A5A3" />
+        <register type="NOA" address="0x00009888" value="0x04B8A100" />
+        <register type="NOA" address="0x00009888" value="0x10B80000" />
+        <register type="NOA" address="0x00009888" value="0x1A590A00" />
+        <register type="NOA" address="0x00009888" value="0x06594000" />
+        <register type="NOA" address="0x00009888" value="0x1C548002" />
+        <register type="NOA" address="0x00009888" value="0x1E540002" />
+        <register type="NOA" address="0x00009888" value="0x0A550030" />
+        <register type="NOA" address="0x00009888" value="0x08552000" />
+        <register type="NOA" address="0x00009888" value="0x1A561400" />
+        <register type="NOA" address="0x00009888" value="0x06568000" />
+        <register type="NOA" address="0x00009888" value="0x0A58A5A3" />
+        <register type="NOA" address="0x00009888" value="0x0258A100" />
+        <register type="NOA" address="0x00009888" value="0x10580000" />
+        <register type="NOA" address="0x00009884" value="0x00000007" />
+        <register type="NOA" address="0x00009888" value="0x2100F000" />
+        <register type="NOA" address="0x00009888" value="0x1D000071" />
+        <register type="NOA" address="0x00009888" value="0x33000000" />
+        <register type="NOA" address="0x00009888" value="0x1100C000" />
+        <register type="NOA" address="0x00009888" value="0x1F00C000" />
+        <register type="NOA" address="0x00009888" value="0x2300C000" />
+        <register type="NOA" address="0x00009888" value="0x2500C000" />
+        <register type="NOA" address="0x00009888" value="0x2700C000" />
+        <register type="NOA" address="0x00009888" value="0x2900C000" />
+        <register type="NOA" address="0x00009888" value="0x2B00C000" />
+        <register type="NOA" address="0x00009888" value="0x2D00C000" />
+        <register type="NOA" address="0x00009888" value="0x2F00C000" />
+        <register type="NOA" address="0x00009888" value="0x1300C000" />
+        <register type="NOA" address="0x00009888" value="0x1500C000" />
+        <register type="NOA" address="0x00009888" value="0x1700C000" />
+        <register type="NOA" address="0x00009888" value="0x1900C000" />
+        <register type="NOA" address="0x00009888" value="0x1B00C000" />
+        <register type="NOA" address="0x00009888" value="0x47000111" />
+        <register type="NOA" address="0x00009888" value="0x39000421" />
+        <register type="NOA" address="0x00009888" value="0x49001300" />
+        <register type="NOA" address="0x00009888" value="0x3D00042B" />
+        <register type="NOA" address="0x00009888" value="0x4B000011" />
+        <register type="NOA" address="0x00009888" value="0x3F001081" />
+        <register type="NOA" address="0x00009888" value="0x4D000000" />
+        <register type="NOA" address="0x00009888" value="0x41000000" />
+        <register type="NOA" address="0x00009888" value="0x35000000" />
+        <register type="NOA" address="0x00009888" value="0x31000000" />
+        <register type="NOA" address="0x00009888" value="0x43000000" />
+        <register type="NOA" address="0x00009888" value="0x3B000004" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x10800000" />
+        <register type="OA" address="0x00002770" value="0x00000000" />
+        <register type="OA" address="0x00002774" value="0x0000FFFC" />
+        <register type="OA" address="0x00002778" value="0x00000000" />
+        <register type="OA" address="0x0000277C" value="0x0000FFF3" />
+        <register type="OA" address="0x00002780" value="0x00000000" />
+        <register type="OA" address="0x00002784" value="0x0000FFCF" />
+        <register type="OA" address="0x00002788" value="0x00000000" />
+        <register type="OA" address="0x0000278C" value="0x0000FF3F" />
+        <register type="OA" address="0x00002790" value="0x00000000" />
+        <register type="OA" address="0x00002794" value="0x0000FCFF" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+    </register_config>
+  </set>
+
+  <set name="Metric set TDL_2"
+       mdapi_supported_apis="VK OGL OCL IO BB"
+       underscore_name="tdl_2"
+       hw_config_guid="aa2d6ab4-99b3-42f8-94d6-4a9aa2baedaf"
+       chipset="CNL"
+       symbol_name="TDL_2"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Thread Header Ready on Slice1 Subslice1 Port 1"
+             description="The percentage of time in which thread header is ready on slice1 subslice1 thread dispatcher port 1"
+             data_type="float"
+             max_equation="100"
+             equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header11_ready_port1"
+             units="percent"
+             symbol_name="ThreadHeader11ReadyPort1"
+             availability="$SubsliceMask 16 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on the both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Thread Header Ready on Slice0 Subslice1 Port 0"
+             description="The percentage of time in which thread header is ready on slice0 subslice1 thread dispatcher port 0"
+             data_type="float"
+             max_equation="100"
+             equation="C 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header01_ready_port0"
+             units="percent"
+             symbol_name="ThreadHeader01ReadyPort0"
+             availability="$SubsliceMask 2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Thread Header Ready on Slice0 Subslice1 Port 1"
+             description="The percentage of time in which thread header is ready on slice0 subslice1 thread dispatcher port 1"
+             data_type="float"
+             max_equation="100"
+             equation="C 1 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header01_ready_port1"
+             units="percent"
+             symbol_name="ThreadHeader01ReadyPort1"
+             availability="$SubsliceMask 2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SQ is full"
+             description="The percentage of time when SQ is filled above a threshold (usually 48 entries)"
+             data_type="float"
+             max_equation="100"
+             equation="B 5 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gt_request_queue_full"
+             units="percent"
+             symbol_name="GTRequestQueueFull"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Thread Header Ready on Slice1 Subslice1 Port 0"
+             description="The percentage of time in which thread header is ready on slice1 subslice1 thread dispatcher port 0"
+             data_type="float"
+             max_equation="100"
+             equation="C 6 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header11_ready_port0"
+             units="percent"
+             symbol_name="ThreadHeader11ReadyPort0"
+             availability="$SubsliceMask 16 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Thread Header Ready on Slice0 Subslice2 Port 1"
+             description="The percentage of time in which thread header is ready on slice0 subslice2 thread dispatcher port 1"
+             data_type="float"
+             max_equation="100"
+             equation="C 3 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header02_ready_port1"
+             units="percent"
+             symbol_name="ThreadHeader02ReadyPort1"
+             availability="$SubsliceMask 4 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Thread Header Ready on Slice0 Subslice2 Port 0"
+             description="The percentage of time in which thread header is ready on slice0 subslice2 thread dispatcher port 0"
+             data_type="float"
+             max_equation="100"
+             equation="C 2 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header02_ready_port0"
+             units="percent"
+             symbol_name="ThreadHeader02ReadyPort0"
+             availability="$SubsliceMask 4 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Thread Header Ready on Slice1 Subslice0 Port 1"
+             description="The percentage of time in which thread header is ready on slice1 subslice0 thread dispatcher port 1"
+             data_type="float"
+             max_equation="100"
+             equation="C 5 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header10_ready_port1"
+             units="percent"
+             symbol_name="ThreadHeader10ReadyPort1"
+             availability="$SubsliceMask 8 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ A 31 READ UADD A 32 READ UADD 64 UMUL"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Thread Header Ready on Slice1 Subslice0 Port 0"
+             description="The percentage of time in which thread header is ready on slice1 subslice0 thread dispatcher port 0"
+             data_type="float"
+             max_equation="100"
+             equation="C 4 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header10_ready_port0"
+             units="percent"
+             symbol_name="ThreadHeader10ReadyPort0"
+             availability="$SubsliceMask 8 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Thread Header Ready on Slice0 Subslice0 Port 0"
+             description="The percentage of time in which thread header is ready on slice0 subslice0 thread dispatcher port 0"
+             data_type="float"
+             max_equation="100"
+             equation="B 6 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header00_ready_port0"
+             units="percent"
+             symbol_name="ThreadHeader00ReadyPort0"
+             availability="$SubsliceMask 1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <counter name="Thread Header Ready on Slice0 Subslice0 Port 1"
+             description="The percentage of time in which thread header is ready on slice0 subslice0 thread dispatcher port 1"
+             data_type="float"
+             max_equation="100"
+             equation="B 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header00_ready_port1"
+             units="percent"
+             symbol_name="ThreadHeader00ReadyPort1"
+             availability="$SubsliceMask 1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00000D04" value="0x00000200" />
+        <register type="NOA" address="0x00009884" value="0x00000000" />
+        <register type="NOA" address="0x00009888" value="0x12184D60" />
+        <register type="NOA" address="0x00009888" value="0x12384D60" />
+        <register type="NOA" address="0x00009888" value="0x12984D60" />
+        <register type="NOA" address="0x00009888" value="0x12B84D60" />
+        <register type="NOA" address="0x00009888" value="0x12584D60" />
+        <register type="NOA" address="0x00009888" value="0x186C2A00" />
+        <register type="NOA" address="0x00009888" value="0x1A6C0001" />
+        <register type="NOA" address="0x00009888" value="0x00738000" />
+        <register type="NOA" address="0x00009888" value="0x02737000" />
+        <register type="NOA" address="0x00009888" value="0x12740140" />
+        <register type="NOA" address="0x00009888" value="0x1475000A" />
+        <register type="NOA" address="0x00009888" value="0x10760028" />
+        <register type="NOA" address="0x00009888" value="0x16777C00" />
+        <register type="NOA" address="0x00009888" value="0x18770001" />
+        <register type="NOA" address="0x00009888" value="0x02774000" />
+        <register type="NOA" address="0x00009888" value="0x04774000" />
+        <register type="NOA" address="0x00009888" value="0x06778000" />
+        <register type="NOA" address="0x00009888" value="0x08778000" />
+        <register type="NOA" address="0x00009888" value="0x0A778000" />
+        <register type="NOA" address="0x00009888" value="0x0C778000" />
+        <register type="NOA" address="0x00009888" value="0x0C7B0280" />
+        <register type="NOA" address="0x00009888" value="0x087BA000" />
+        <register type="NOA" address="0x00009888" value="0x167C0280" />
+        <register type="NOA" address="0x00009888" value="0x027CC000" />
+        <register type="NOA" address="0x00009888" value="0x047CC000" />
+        <register type="NOA" address="0x00009888" value="0x1E7D2800" />
+        <register type="NOA" address="0x00009888" value="0x1A192000" />
+        <register type="NOA" address="0x00009888" value="0x1C190001" />
+        <register type="NOA" address="0x00009888" value="0x1E140028" />
+        <register type="NOA" address="0x00009888" value="0x0A1500C0" />
+        <register type="NOA" address="0x00009888" value="0x1A164000" />
+        <register type="NOA" address="0x00009888" value="0x1C160002" />
+        <register type="NOA" address="0x00009888" value="0x0C18AFA7" />
+        <register type="NOA" address="0x00009888" value="0x10180000" />
+        <register type="NOA" address="0x00009888" value="0x1C390014" />
+        <register type="NOA" address="0x00009888" value="0x1E340280" />
+        <register type="NOA" address="0x00009888" value="0x0A350300" />
+        <register type="NOA" address="0x00009888" value="0x1C360028" />
+        <register type="NOA" address="0x00009888" value="0x0E38AFA7" />
+        <register type="NOA" address="0x00009888" value="0x10380000" />
+        <register type="NOA" address="0x00009888" value="0x06F48000" />
+        <register type="NOA" address="0x00009888" value="0x08F42000" />
+        <register type="NOA" address="0x00009888" value="0x06F58000" />
+        <register type="NOA" address="0x00009888" value="0x08F52000" />
+        <register type="NOA" address="0x00009888" value="0x0EF6000A" />
+        <register type="NOA" address="0x00009888" value="0x06F7C000" />
+        <register type="NOA" address="0x00009888" value="0x08F7C000" />
+        <register type="NOA" address="0x00009888" value="0x0AF74000" />
+        <register type="NOA" address="0x00009888" value="0x0CF74000" />
+        <register type="NOA" address="0x00009888" value="0x0AFB00A0" />
+        <register type="NOA" address="0x00009888" value="0x0AFC8000" />
+        <register type="NOA" address="0x00009888" value="0x0CFC8000" />
+        <register type="NOA" address="0x00009888" value="0x1CFD0A00" />
+        <register type="NOA" address="0x00009888" value="0x06994000" />
+        <register type="NOA" address="0x00009888" value="0x08994000" />
+        <register type="NOA" address="0x00009888" value="0x1C94000A" />
+        <register type="NOA" address="0x00009888" value="0x08956000" />
+        <register type="NOA" address="0x00009888" value="0x06968000" />
+        <register type="NOA" address="0x00009888" value="0x08968000" />
+        <register type="NOA" address="0x00009888" value="0x0298A700" />
+        <register type="NOA" address="0x00009888" value="0x049800AF" />
+        <register type="NOA" address="0x00009888" value="0x10980000" />
+        <register type="NOA" address="0x00009888" value="0x0AB94000" />
+        <register type="NOA" address="0x00009888" value="0x0CB94000" />
+        <register type="NOA" address="0x00009888" value="0x1CB400A0" />
+        <register type="NOA" address="0x00009888" value="0x08B58000" />
+        <register type="NOA" address="0x00009888" value="0x0AB50001" />
+        <register type="NOA" address="0x00009888" value="0x0AB68000" />
+        <register type="NOA" address="0x00009888" value="0x0CB68000" />
+        <register type="NOA" address="0x00009888" value="0x04B8A700" />
+        <register type="NOA" address="0x00009888" value="0x06B800AF" />
+        <register type="NOA" address="0x00009888" value="0x10B80000" />
+        <register type="NOA" address="0x00009888" value="0x02594000" />
+        <register type="NOA" address="0x00009888" value="0x04594000" />
+        <register type="NOA" address="0x00009888" value="0x1A54A000" />
+        <register type="NOA" address="0x00009888" value="0x00558000" />
+        <register type="NOA" address="0x00009888" value="0x08551000" />
+        <register type="NOA" address="0x00009888" value="0x02568000" />
+        <register type="NOA" address="0x00009888" value="0x04568000" />
+        <register type="NOA" address="0x00009888" value="0x0058A700" />
+        <register type="NOA" address="0x00009888" value="0x025800AF" />
+        <register type="NOA" address="0x00009888" value="0x10580000" />
+        <register type="NOA" address="0x00009884" value="0x00000007" />
+        <register type="NOA" address="0x00009888" value="0x21003000" />
+        <register type="NOA" address="0x00009888" value="0x27000071" />
+        <register type="NOA" address="0x00009888" value="0x33000000" />
+        <register type="NOA" address="0x00009888" value="0x2900C000" />
+        <register type="NOA" address="0x00009888" value="0x2B00C000" />
+        <register type="NOA" address="0x00009888" value="0x2D00C000" />
+        <register type="NOA" address="0x00009888" value="0x2F00C000" />
+        <register type="NOA" address="0x00009888" value="0x1300C000" />
+        <register type="NOA" address="0x00009888" value="0x1500C000" />
+        <register type="NOA" address="0x00009888" value="0x1700C000" />
+        <register type="NOA" address="0x00009888" value="0x1900C000" />
+        <register type="NOA" address="0x00009888" value="0x1B00C000" />
+        <register type="NOA" address="0x00009888" value="0x1D00C000" />
+        <register type="NOA" address="0x00009888" value="0x4B003000" />
+        <register type="NOA" address="0x00009888" value="0x3F002C00" />
+        <register type="NOA" address="0x00009888" value="0x4D001111" />
+        <register type="NOA" address="0x00009888" value="0x41000421" />
+        <register type="NOA" address="0x00009888" value="0x35000000" />
+        <register type="NOA" address="0x00009888" value="0x31000000" />
+        <register type="NOA" address="0x00009888" value="0x43000001" />
+        <register type="NOA" address="0x00009888" value="0x47000000" />
+        <register type="NOA" address="0x00009888" value="0x39001080" />
+        <register type="NOA" address="0x00009888" value="0x3B000000" />
+        <register type="NOA" address="0x00009888" value="0x49000000" />
+        <register type="NOA" address="0x00009888" value="0x3D000000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x00800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+    </register_config>
+  </set>
+
+  <set name="Metric set TestOa"
+       mdapi_supported_apis="VK OGL OCL IO BB"
+       underscore_name="test_oa"
+       hw_config_guid="db41edd4-d8e7-4730-ad11-b9a2d6833503"
+       chipset="CNL"
+       symbol_name="TestOa"
+       >
+    <counter name="TestCounter7"
+             description="HW test counter 7. Factor: 0.6666"
+             data_type="uint64"
+             equation="B 7 READ"
+             underscore_name="counter7"
+             units="events"
+             symbol_name="Counter7"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="TestCounter8"
+             description="HW test counter 8. Should be equal to 1."
+             data_type="uint64"
+             equation="C 7 READ"
+             underscore_name="counter8"
+             units="events"
+             symbol_name="Counter8"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="TestCounter4"
+             description="HW test counter 4. Factor: 0.3333"
+             data_type="uint64"
+             equation="B 4 READ"
+             underscore_name="counter4"
+             units="events"
+             symbol_name="Counter4"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="TestCounter5"
+             description="HW test counter 5. Factor: 0.3333"
+             data_type="uint64"
+             equation="B 5 READ"
+             underscore_name="counter5"
+             units="events"
+             symbol_name="Counter5"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="TestCounter6"
+             description="HW test counter 6. Factor: 0.16666"
+             data_type="uint64"
+             equation="B 6 READ"
+             underscore_name="counter6"
+             units="events"
+             symbol_name="Counter6"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="TestCounter3"
+             description="HW test counter 3. Factor: 0.5"
+             data_type="uint64"
+             equation="B 3 READ"
+             underscore_name="counter3"
+             units="events"
+             symbol_name="Counter3"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="TestCounter0"
+             description="HW test counter 0. Factor: 0.0"
+             data_type="uint64"
+             equation="B 0 READ"
+             underscore_name="counter0"
+             units="events"
+             symbol_name="Counter0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="TestCounter1"
+             description="HW test counter 1. Factor: 1.0"
+             data_type="uint64"
+             equation="B 1 READ"
+             underscore_name="counter1"
+             units="events"
+             symbol_name="Counter1"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="TestCounter2"
+             description="HW test counter 2. Factor: 1.0"
+             data_type="uint64"
+             equation="B 2 READ"
+             underscore_name="counter2"
+             units="events"
+             symbol_name="Counter2"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00000D04" value="0x00000200" />
+        <register type="NOA" address="0x00009884" value="0x00000007" />
+        <register type="NOA" address="0x00009888" value="0x17060000" />
+        <register type="NOA" address="0x00009840" value="0x00000000" />
+        <register type="NOA" address="0x00009884" value="0x00000007" />
+        <register type="NOA" address="0x00009888" value="0x13034000" />
+        <register type="NOA" address="0x00009884" value="0x00000007" />
+        <register type="NOA" address="0x00009888" value="0x07060066" />
+        <register type="NOA" address="0x00009884" value="0x00000007" />
+        <register type="NOA" address="0x00009888" value="0x05060000" />
+        <register type="NOA" address="0x00009884" value="0x00000007" />
+        <register type="NOA" address="0x00009888" value="0x0F080040" />
+        <register type="NOA" address="0x00009884" value="0x00000007" />
+        <register type="NOA" address="0x00009888" value="0x07091000" />
+        <register type="NOA" address="0x00009884" value="0x00000007" />
+        <register type="NOA" address="0x00009888" value="0x0F041000" />
+        <register type="NOA" address="0x00009884" value="0x00000007" />
+        <register type="NOA" address="0x00009888" value="0x1D004000" />
+        <register type="NOA" address="0x00009884" value="0x00000007" />
+        <register type="NOA" address="0x00009888" value="0x35000000" />
+        <register type="NOA" address="0x00009884" value="0x00000007" />
+        <register type="NOA" address="0x00009888" value="0x49000000" />
+        <register type="NOA" address="0x00009884" value="0x00000007" />
+        <register type="NOA" address="0x00009888" value="0x3D000000" />
+        <register type="NOA" address="0x00009884" value="0x00000007" />
+        <register type="NOA" address="0x00009888" value="0x31000000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0xF0800000" />
+        <register type="OA" address="0x00002770" value="0x00000004" />
+        <register type="OA" address="0x00002774" value="0x0000FFFF" />
+        <register type="OA" address="0x00002778" value="0x00000003" />
+        <register type="OA" address="0x0000277C" value="0x0000FFFF" />
+        <register type="OA" address="0x00002780" value="0x00000007" />
+        <register type="OA" address="0x00002784" value="0x0000FFFF" />
+        <register type="OA" address="0x00002788" value="0x00100002" />
+        <register type="OA" address="0x0000278C" value="0x0000FFF7" />
+        <register type="OA" address="0x00002790" value="0x00100002" />
+        <register type="OA" address="0x00002794" value="0x0000FFCF" />
+        <register type="OA" address="0x00002798" value="0x00100082" />
+        <register type="OA" address="0x0000279C" value="0x0000FFEF" />
+        <register type="OA" address="0x000027A0" value="0x001000C2" />
+        <register type="OA" address="0x000027A4" value="0x0000FFE7" />
+        <register type="OA" address="0x000027A8" value="0x00100001" />
+        <register type="OA" address="0x000027AC" value="0x0000FFE7" />
+    </register_config>
+  </set>
+
+</metrics>
diff --git a/lib/i915/perf-configs/oa-glk.xml b/lib/i915/perf-configs/oa-glk.xml
new file mode 100644
index 00000000..e32c5c4c
--- /dev/null
+++ b/lib/i915/perf-configs/oa-glk.xml
@@ -0,0 +1,9346 @@
+<?xml version="1.0"?>
+<metrics version="1581935520" merge_md5="">
+  <set name="Render Metrics Basic Gen9"
+       mdapi_supported_apis="VK OGL OCL IO BB"
+       underscore_name="render_basic"
+       hw_config_guid="d72df5c7-5b4a-4274-a43f-00b0fd51fc68"
+       chipset="GLK"
+       symbol_name="RenderBasic"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Misses"
+             description="The total number of L3 misses."
+             data_type="uint64"
+             equation="C 4 READ"
+             underscore_name="l3_misses"
+             units="messages"
+             symbol_name="L3Misses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/TAG"
+             />
+    <counter name="GTI L3 Throughput"
+             description="The total number of GPU memory bytes transferred between L3 caches and GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="$L3Misses 64 UMUL"
+             underscore_name="gti_l3_throughput"
+             units="bytes"
+             symbol_name="GtiL3Throughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Cache Misses"
+             description="The total number of sampler cache misses in all LODs in all sampler units."
+             data_type="uint64"
+             equation="B 4 READ 8 UMUL"
+             underscore_name="sampler_l1_misses"
+             units="messages"
+             symbol_name="SamplerL1Misses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler 1 Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which Sampler 1 has been slowing down the pipe when processing EU requests."
+             data_type="float"
+             high_watermark="15"
+             equation="B 3 READ 100 UMUL $GpuCoreClocks FDIV"
+             max_equation="100"
+             underscore_name="sampler1_bottleneck"
+             units="percent"
+             symbol_name="Sampler1Bottleneck"
+             availability="$SubsliceMask 0x12 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="L3 Sampler Throughput"
+             description="The total number of GPU memory bytes transferred between samplers and L3 caches."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="$SamplerL1Misses 64 UMUL"
+             underscore_name="l3_sampler_throughput"
+             units="bytes"
+             symbol_name="L3SamplerThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Sampler"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on the both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Sampler 0 Busy"
+             description="The percentage of time in which Sampler 0 has been processing EU requests."
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler0_busy"
+             units="percent"
+             symbol_name="Sampler0Busy"
+             availability="$SubsliceMask 0x09 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_group="Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Sampler 1 Busy"
+             description="The percentage of time in which Sampler 1 has been processing EU requests."
+             data_type="float"
+             max_equation="100"
+             equation="B 1 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler1_busy"
+             units="percent"
+             symbol_name="Sampler1Busy"
+             availability="$SubsliceMask 0x12 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_group="Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Samplers Busy"
+             description="The percentage of time in which samplers have been processing EU requests."
+             data_type="float"
+             max_equation="100"
+             equation="$Sampler0Busy $Sampler1Busy FMAX"
+             underscore_name="samplers_busy"
+             units="percent"
+             symbol_name="SamplersBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="Sampler"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="GTI Fixed Pipe Throughput"
+             description="The total number of GPU memory bytes transferred between 3D Pipeline (Command Dispatch, Input Assembly and Stream Output) and GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL"
+             equation="B 6 READ B 7 READ UADD 64 UMUL"
+             underscore_name="gti_vf_throughput"
+             units="bytes"
+             symbol_name="GtiVfThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="GTI/3D Pipe"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler 0 Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which Sampler 0 has been slowing down the pipe when processing EU requests."
+             data_type="float"
+             high_watermark="15"
+             equation="B 2 READ 100 UMUL $GpuCoreClocks FDIV"
+             max_equation="100"
+             underscore_name="sampler0_bottleneck"
+             units="percent"
+             symbol_name="Sampler0Bottleneck"
+             availability="$SubsliceMask 0x09 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="L3 Lookup Accesses w/o IC"
+             description="The total number of L3 cache lookup accesses w/o IC."
+             data_type="uint64"
+             equation="$SamplerL1Misses $ShaderMemoryAccesses UADD"
+             underscore_name="l3_lookups"
+             units="messages"
+             symbol_name="L3Lookups"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/TAG"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GTI Read Throughput"
+             description="The total number of GPU memory bytes read from GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL"
+             equation="C 6 READ 64 UMUL"
+             underscore_name="gti_read_throughput"
+             units="bytes"
+             symbol_name="GtiReadThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GTI Depth Throughput"
+             description="The total number of GPU memory bytes transferred between depth caches and GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="C 0 READ C 1 READ UADD 64 UMUL"
+             underscore_name="gti_depth_throughput"
+             units="bytes"
+             symbol_name="GtiDepthThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="GTI/Depth Cache"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Samplers Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which samplers have been slowing down the pipe when processing EU requests."
+             data_type="float"
+             high_watermark="15"
+             equation="$Sampler0Bottleneck $Sampler1Bottleneck FMAX"
+             max_equation="100"
+             underscore_name="sampler_bottleneck"
+             units="percent"
+             symbol_name="SamplerBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Indicate System Frame Batch Draw"
+             mdapi_group="Sampler"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="GTI HDC TLB Lookup Throughput"
+             description="The total number of GPU memory bytes transferred between GTI and HDC, when HDC is doing TLB lookups."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="C 5 READ 64 UMUL"
+             underscore_name="gti_hdc_lookups_throughput"
+             units="bytes"
+             symbol_name="GtiHdcLookupsThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GTI RCC Throughput"
+             description="The total number of GPU memory bytes transferred between render color caches and GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="C 2 READ C 3 READ UADD 64 UMUL"
+             underscore_name="gti_rcc_throughput"
+             units="bytes"
+             symbol_name="GtiRccThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="GTI/Color Cache"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="GTI Write Throughput"
+             description="The total number of GPU memory bytes written to GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 32 UMUL"
+             equation="C 7 READ 64 UMUL"
+             underscore_name="gti_write_throughput"
+             units="bytes"
+             symbol_name="GtiWriteThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x166C00F0" />
+        <register type="NOA" address="0x00009888" value="0x12120280" />
+        <register type="NOA" address="0x00009888" value="0x12320280" />
+        <register type="NOA" address="0x00009888" value="0x11930317" />
+        <register type="NOA" address="0x00009888" value="0x159303DF" />
+        <register type="NOA" address="0x00009888" value="0x3F900C00" />
+        <register type="NOA" address="0x00009888" value="0x419000A0" />
+        <register type="NOA" address="0x00009888" value="0x002D1000" />
+        <register type="NOA" address="0x00009888" value="0x062D4000" />
+        <register type="NOA" address="0x00009888" value="0x082D5000" />
+        <register type="NOA" address="0x00009888" value="0x0A2D1000" />
+        <register type="NOA" address="0x00009888" value="0x0C2E0800" />
+        <register type="NOA" address="0x00009888" value="0x0E2E5900" />
+        <register type="NOA" address="0x00009888" value="0x0A4C8000" />
+        <register type="NOA" address="0x00009888" value="0x0C4C8000" />
+        <register type="NOA" address="0x00009888" value="0x0E4C4000" />
+        <register type="NOA" address="0x00009888" value="0x064E8000" />
+        <register type="NOA" address="0x00009888" value="0x084E8000" />
+        <register type="NOA" address="0x00009888" value="0x0A4E2000" />
+        <register type="NOA" address="0x00009888" value="0x1C4F0010" />
+        <register type="NOA" address="0x00009888" value="0x0A6C0053" />
+        <register type="NOA" address="0x00009888" value="0x106C0000" />
+        <register type="NOA" address="0x00009888" value="0x1C6C0000" />
+        <register type="NOA" address="0x00009888" value="0x1A0FCC00" />
+        <register type="NOA" address="0x00009888" value="0x1C0F0002" />
+        <register type="NOA" address="0x00009888" value="0x1C2C0040" />
+        <register type="NOA" address="0x00009888" value="0x00101000" />
+        <register type="NOA" address="0x00009888" value="0x04101000" />
+        <register type="NOA" address="0x00009888" value="0x00114000" />
+        <register type="NOA" address="0x00009888" value="0x08114000" />
+        <register type="NOA" address="0x00009888" value="0x00120020" />
+        <register type="NOA" address="0x00009888" value="0x08120021" />
+        <register type="NOA" address="0x00009888" value="0x00141000" />
+        <register type="NOA" address="0x00009888" value="0x08141000" />
+        <register type="NOA" address="0x00009888" value="0x02308000" />
+        <register type="NOA" address="0x00009888" value="0x04302000" />
+        <register type="NOA" address="0x00009888" value="0x06318000" />
+        <register type="NOA" address="0x00009888" value="0x08318000" />
+        <register type="NOA" address="0x00009888" value="0x06320800" />
+        <register type="NOA" address="0x00009888" value="0x08320840" />
+        <register type="NOA" address="0x00009888" value="0x00320000" />
+        <register type="NOA" address="0x00009888" value="0x06344000" />
+        <register type="NOA" address="0x00009888" value="0x08344000" />
+        <register type="NOA" address="0x00009888" value="0x0D931831" />
+        <register type="NOA" address="0x00009888" value="0x0F939F3F" />
+        <register type="NOA" address="0x00009888" value="0x01939E80" />
+        <register type="NOA" address="0x00009888" value="0x039303BC" />
+        <register type="NOA" address="0x00009888" value="0x0593000E" />
+        <register type="NOA" address="0x00009888" value="0x1993002A" />
+        <register type="NOA" address="0x00009888" value="0x07930000" />
+        <register type="NOA" address="0x00009888" value="0x09930000" />
+        <register type="NOA" address="0x00009888" value="0x1D900177" />
+        <register type="NOA" address="0x00009888" value="0x1F900187" />
+        <register type="NOA" address="0x00009888" value="0x35900000" />
+        <register type="NOA" address="0x00009888" value="0x13904000" />
+        <register type="NOA" address="0x00009888" value="0x21904000" />
+        <register type="NOA" address="0x00009888" value="0x23904000" />
+        <register type="NOA" address="0x00009888" value="0x25904000" />
+        <register type="NOA" address="0x00009888" value="0x27904000" />
+        <register type="NOA" address="0x00009888" value="0x2B904000" />
+        <register type="NOA" address="0x00009888" value="0x2D904000" />
+        <register type="NOA" address="0x00009888" value="0x2F904000" />
+        <register type="NOA" address="0x00009888" value="0x31904000" />
+        <register type="NOA" address="0x00009888" value="0x15904000" />
+        <register type="NOA" address="0x00009888" value="0x17904000" />
+        <register type="NOA" address="0x00009888" value="0x19904000" />
+        <register type="NOA" address="0x00009888" value="0x1B904000" />
+        <register type="NOA" address="0x00009888" value="0x53901110" />
+        <register type="NOA" address="0x00009888" value="0x43900423" />
+        <register type="NOA" address="0x00009888" value="0x55900111" />
+        <register type="NOA" address="0x00009888" value="0x47900C02" />
+        <register type="NOA" address="0x00009888" value="0x57900000" />
+        <register type="NOA" address="0x00009888" value="0x49900020" />
+        <register type="NOA" address="0x00009888" value="0x59901111" />
+        <register type="NOA" address="0x00009888" value="0x4B900421" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+        <register type="NOA" address="0x00009888" value="0x4D900001" />
+        <register type="NOA" address="0x00009888" value="0x45900821" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x00800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+        <register type="OA" address="0x00002740" value="0x00000000" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E758" value="0x00015014" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+        <register type="FLEX" address="0x0000E65C" value="0x00055054" />
+    </register_config>
+  </set>
+
+  <set name="Compute Metrics Basic Gen9"
+       mdapi_supported_apis="VK OGL4 OCL IO BB"
+       underscore_name="compute_basic"
+       hw_config_guid="814285f6-354d-41d2-ba49-e24e622714a0"
+       chipset="GLK"
+       symbol_name="ComputeBasic"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Untyped Bytes Read"
+             description="The total number of untyped memory bytes read via Data Port."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="B 6 READ B 7 READ UADD $EuSlicesTotalCount 64 UMUL UMUL"
+             underscore_name="untyped_bytes_read"
+             units="bytes"
+             symbol_name="UntypedBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Typed Bytes Written"
+             description="The total number of typed memory bytes written via Data Port."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="B 3 READ B 4 READ UADD $EuSlicesTotalCount 64 UMUL UMUL"
+             underscore_name="typed_bytes_written"
+             units="bytes"
+             symbol_name="TypedBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="fpu0_active"
+             units="percent"
+             symbol_name="Fpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="fpu1_active"
+             units="percent"
+             symbol_name="Fpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU AVG IPC Rate"
+             description="The average rate of IPC calculated for 2 FPU pipelines."
+             data_type="float"
+             max_equation="2"
+             equation="A 9 READ  A 10 READ  A 11 READ UADD  A 9 READ USUB FDIV 1 FADD"
+             underscore_name="eu_avg_ipc_rate"
+             units="number"
+             symbol_name="EuAvgIpcRate"
+             semantic_type="ratio"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier4 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texel lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GTI Read Throughput"
+             description="The total number of GPU memory bytes read from GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="C 4 READ 64 UMUL"
+             underscore_name="gti_read_throughput"
+             units="bytes"
+             symbol_name="GtiReadThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Untyped Writes"
+             description="The total number of untyped memory bytes written via Data Port."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="C 1 READ C 2 READ UADD $EuSlicesTotalCount 64 UMUL UMUL"
+             underscore_name="untyped_bytes_written"
+             units="bytes"
+             symbol_name="UntypedBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="Typed Bytes Read"
+             description="The total number of typed memory bytes read via Data Port."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="B 0 READ B 1 READ UADD $EuSlicesTotalCount 64 UMUL UMUL"
+             underscore_name="typed_bytes_read"
+             units="bytes"
+             symbol_name="TypedBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="EU Thread Occupancy"
+             description="The percentage of time in which hardware threads occupied EUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 13 READ 8 UMUL $EuCoresTotalCount UDIV $EuThreadsCount UDIV 100 UMUL  $GpuCoreClocks FDIV"
+             underscore_name="eu_thread_occupancy"
+             units="percent"
+             symbol_name="EuThreadOccupancy"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="GTI Write Throughput"
+             description="The total number of GPU memory bytes written to GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 32 UMUL"
+             equation="C 5 READ 64 UMUL"
+             underscore_name="gti_write_throughput"
+             units="bytes"
+             symbol_name="GtiWriteThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <counter name="EU Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_send_active"
+             units="percent"
+             symbol_name="EuSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x104F00E0" />
+        <register type="NOA" address="0x00009888" value="0x124F1C00" />
+        <register type="NOA" address="0x00009888" value="0x39900340" />
+        <register type="NOA" address="0x00009888" value="0x3F900C00" />
+        <register type="NOA" address="0x00009888" value="0x41900000" />
+        <register type="NOA" address="0x00009888" value="0x002D5000" />
+        <register type="NOA" address="0x00009888" value="0x062D4000" />
+        <register type="NOA" address="0x00009888" value="0x082D4000" />
+        <register type="NOA" address="0x00009888" value="0x0A2D1000" />
+        <register type="NOA" address="0x00009888" value="0x0C2D5000" />
+        <register type="NOA" address="0x00009888" value="0x0E2D4000" />
+        <register type="NOA" address="0x00009888" value="0x0C2E1400" />
+        <register type="NOA" address="0x00009888" value="0x0E2E5100" />
+        <register type="NOA" address="0x00009888" value="0x102E0114" />
+        <register type="NOA" address="0x00009888" value="0x044CC000" />
+        <register type="NOA" address="0x00009888" value="0x0A4C8000" />
+        <register type="NOA" address="0x00009888" value="0x0C4C8000" />
+        <register type="NOA" address="0x00009888" value="0x0E4C4000" />
+        <register type="NOA" address="0x00009888" value="0x104C8000" />
+        <register type="NOA" address="0x00009888" value="0x124C8000" />
+        <register type="NOA" address="0x00009888" value="0x164C2000" />
+        <register type="NOA" address="0x00009888" value="0x004EA000" />
+        <register type="NOA" address="0x00009888" value="0x064E8000" />
+        <register type="NOA" address="0x00009888" value="0x084E8000" />
+        <register type="NOA" address="0x00009888" value="0x0A4E2000" />
+        <register type="NOA" address="0x00009888" value="0x0C4EA000" />
+        <register type="NOA" address="0x00009888" value="0x0E4E8000" />
+        <register type="NOA" address="0x00009888" value="0x004F6B42" />
+        <register type="NOA" address="0x00009888" value="0x064F6200" />
+        <register type="NOA" address="0x00009888" value="0x084F4100" />
+        <register type="NOA" address="0x00009888" value="0x0A4F0061" />
+        <register type="NOA" address="0x00009888" value="0x0C4F6C4C" />
+        <register type="NOA" address="0x00009888" value="0x0E4F4B00" />
+        <register type="NOA" address="0x00009888" value="0x1A4F0000" />
+        <register type="NOA" address="0x00009888" value="0x1C4F0000" />
+        <register type="NOA" address="0x00009888" value="0x180F5000" />
+        <register type="NOA" address="0x00009888" value="0x1A0F8800" />
+        <register type="NOA" address="0x00009888" value="0x1C0F08A2" />
+        <register type="NOA" address="0x00009888" value="0x182C4000" />
+        <register type="NOA" address="0x00009888" value="0x1C2C1451" />
+        <register type="NOA" address="0x00009888" value="0x1E2C0001" />
+        <register type="NOA" address="0x00009888" value="0x1A2C0010" />
+        <register type="NOA" address="0x00009888" value="0x01938000" />
+        <register type="NOA" address="0x00009888" value="0x0F938000" />
+        <register type="NOA" address="0x00009888" value="0x19938A28" />
+        <register type="NOA" address="0x00009888" value="0x03938000" />
+        <register type="NOA" address="0x00009888" value="0x19900177" />
+        <register type="NOA" address="0x00009888" value="0x1B900178" />
+        <register type="NOA" address="0x00009888" value="0x1D900125" />
+        <register type="NOA" address="0x00009888" value="0x1F900123" />
+        <register type="NOA" address="0x00009888" value="0x35900000" />
+        <register type="NOA" address="0x00009888" value="0x13904000" />
+        <register type="NOA" address="0x00009888" value="0x21904000" />
+        <register type="NOA" address="0x00009888" value="0x25904000" />
+        <register type="NOA" address="0x00009888" value="0x27904000" />
+        <register type="NOA" address="0x00009888" value="0x2B904000" />
+        <register type="NOA" address="0x00009888" value="0x2D904000" />
+        <register type="NOA" address="0x00009888" value="0x31904000" />
+        <register type="NOA" address="0x00009888" value="0x15904000" />
+        <register type="NOA" address="0x00009888" value="0x53901000" />
+        <register type="NOA" address="0x00009888" value="0x43900000" />
+        <register type="NOA" address="0x00009888" value="0x55900111" />
+        <register type="NOA" address="0x00009888" value="0x47900000" />
+        <register type="NOA" address="0x00009888" value="0x57900000" />
+        <register type="NOA" address="0x00009888" value="0x49900000" />
+        <register type="NOA" address="0x00009888" value="0x59900000" />
+        <register type="NOA" address="0x00009888" value="0x4B900000" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+        <register type="NOA" address="0x00009888" value="0x4D900000" />
+        <register type="NOA" address="0x00009888" value="0x45900000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x00800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+        <register type="OA" address="0x00002740" value="0x00000000" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00000003" />
+        <register type="FLEX" address="0x0000E658" value="0x00002001" />
+        <register type="FLEX" address="0x0000E758" value="0x00778008" />
+        <register type="FLEX" address="0x0000E45C" value="0x00088078" />
+        <register type="FLEX" address="0x0000E55C" value="0x00808708" />
+        <register type="FLEX" address="0x0000E65C" value="0x00A08908" />
+    </register_config>
+  </set>
+
+  <set name="Render Metrics for 3D Pipeline Profile Gen9"
+       mdapi_supported_apis="VK OGL OCL IO BB"
+       underscore_name="render_pipe_profile"
+       hw_config_guid="07d397a6-b3e6-49f6-9433-a4f293d55978"
+       chipset="GLK"
+       symbol_name="RenderPipeProfile"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Bottleneck"
+             low_watermark="10"
+             description="The percentage of time in which vertex shader pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="30"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_bottleneck"
+             units="percent"
+             symbol_name="VsBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Hi-Depth Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which early hierarchical depth test pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="15"
+             equation="C 6 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="hi_depth_bottleneck"
+             units="percent"
+             symbol_name="HiDepthBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which geometry shader pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="15"
+             equation="B 3 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gs_bottleneck"
+             units="percent"
+             symbol_name="GsBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Geometry Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="BC Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which barycentric coordinates calculation pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="15"
+             equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="bc_bottleneck"
+             units="percent"
+             symbol_name="BcBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Rasterizer/Barycentric Calc"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="HS Stall"
+             description="The percentage of time in which hull shader pipeline stage was stalled."
+             data_type="float"
+             equation="C 1 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="hs_stall"
+             units="percent"
+             symbol_name="HsStall"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier4 Correlate Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Hull Shader"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texel lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="VF Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which vertex fetch pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="15"
+             equation="C 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vf_bottleneck"
+             units="percent"
+             symbol_name="VfBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Input Assembler"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Strip-Fans Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which strip-fans pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="10"
+             equation="B 6 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sf_bottleneck"
+             units="percent"
+             symbol_name="SfBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Rasterizer/Strip-Fans"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SF Stall"
+             description="The percentage of time in which strip-fans pipeline stage was stalled."
+             data_type="float"
+             equation="C 5 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sf_stall"
+             units="percent"
+             symbol_name="SfStall"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Correlate Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Strip-Fans"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="HS Bottleneck"
+             low_watermark="3"
+             description="The percentage of time in which hull shader pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="9"
+             equation="B 1 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="hs_bottleneck"
+             units="percent"
+             symbol_name="HsBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Hull Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="CL Stall"
+             description="The percentage of time in which clipper pipeline stage was stalled."
+             data_type="float"
+             equation="C 4 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="cl_stall"
+             units="percent"
+             symbol_name="ClStall"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Correlate Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Clipper"
+             />
+    <counter name="SO Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which stream output pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="15"
+             equation="B 4 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="so_bottleneck"
+             units="percent"
+             symbol_name="SoBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Stream Output"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="DS Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which domain shader pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="15"
+             equation="B 2 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ds_bottleneck"
+             units="percent"
+             symbol_name="DsBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Domain Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Clipper Bottleneck"
+             low_watermark="10"
+             description="The percentage of time in which clipper pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="30"
+             equation="B 5 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="cl_bottleneck"
+             units="percent"
+             symbol_name="ClBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Clipper"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Stall"
+             description="The percentage of time in which domain shader pipeline stage was stalled."
+             data_type="float"
+             equation="C 2 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ds_stall"
+             units="percent"
+             symbol_name="DsStall"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier4 Correlate Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Domain Shader"
+             />
+    <counter name="Early Depth Bottleneck"
+             low_watermark="10"
+             description="The percentage of time in which early depth test pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="30"
+             equation="B 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="early_depth_bottleneck"
+             units="percent"
+             symbol_name="EarlyDepthBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="SO Stall"
+             description="The percentage of time in which stream-output pipeline stage was stalled."
+             data_type="float"
+             equation="C 3 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="so_stall"
+             units="percent"
+             symbol_name="SoStall"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Correlate Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Stream Output"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x0C2E001F" />
+        <register type="NOA" address="0x00009888" value="0x0A2F0000" />
+        <register type="NOA" address="0x00009888" value="0x10186800" />
+        <register type="NOA" address="0x00009888" value="0x11810019" />
+        <register type="NOA" address="0x00009888" value="0x15810013" />
+        <register type="NOA" address="0x00009888" value="0x13820020" />
+        <register type="NOA" address="0x00009888" value="0x11830020" />
+        <register type="NOA" address="0x00009888" value="0x17840000" />
+        <register type="NOA" address="0x00009888" value="0x11860007" />
+        <register type="NOA" address="0x00009888" value="0x21860000" />
+        <register type="NOA" address="0x00009888" value="0x178703E0" />
+        <register type="NOA" address="0x00009888" value="0x0C2D8000" />
+        <register type="NOA" address="0x00009888" value="0x042D4000" />
+        <register type="NOA" address="0x00009888" value="0x062D1000" />
+        <register type="NOA" address="0x00009888" value="0x022E5400" />
+        <register type="NOA" address="0x00009888" value="0x002E0000" />
+        <register type="NOA" address="0x00009888" value="0x0E2E0080" />
+        <register type="NOA" address="0x00009888" value="0x082F0040" />
+        <register type="NOA" address="0x00009888" value="0x002F0000" />
+        <register type="NOA" address="0x00009888" value="0x06143000" />
+        <register type="NOA" address="0x00009888" value="0x06174000" />
+        <register type="NOA" address="0x00009888" value="0x06180012" />
+        <register type="NOA" address="0x00009888" value="0x00180000" />
+        <register type="NOA" address="0x00009888" value="0x0D804000" />
+        <register type="NOA" address="0x00009888" value="0x0F804000" />
+        <register type="NOA" address="0x00009888" value="0x05804000" />
+        <register type="NOA" address="0x00009888" value="0x09810200" />
+        <register type="NOA" address="0x00009888" value="0x0B810030" />
+        <register type="NOA" address="0x00009888" value="0x03810003" />
+        <register type="NOA" address="0x00009888" value="0x21819140" />
+        <register type="NOA" address="0x00009888" value="0x23819050" />
+        <register type="NOA" address="0x00009888" value="0x25810018" />
+        <register type="NOA" address="0x00009888" value="0x0B820980" />
+        <register type="NOA" address="0x00009888" value="0x03820D80" />
+        <register type="NOA" address="0x00009888" value="0x11820000" />
+        <register type="NOA" address="0x00009888" value="0x0182C000" />
+        <register type="NOA" address="0x00009888" value="0x07828000" />
+        <register type="NOA" address="0x00009888" value="0x09824000" />
+        <register type="NOA" address="0x00009888" value="0x0F828000" />
+        <register type="NOA" address="0x00009888" value="0x0D830004" />
+        <register type="NOA" address="0x00009888" value="0x0583000C" />
+        <register type="NOA" address="0x00009888" value="0x0F831000" />
+        <register type="NOA" address="0x00009888" value="0x01848072" />
+        <register type="NOA" address="0x00009888" value="0x11840000" />
+        <register type="NOA" address="0x00009888" value="0x07848000" />
+        <register type="NOA" address="0x00009888" value="0x09844000" />
+        <register type="NOA" address="0x00009888" value="0x0F848000" />
+        <register type="NOA" address="0x00009888" value="0x07860000" />
+        <register type="NOA" address="0x00009888" value="0x09860092" />
+        <register type="NOA" address="0x00009888" value="0x0F860400" />
+        <register type="NOA" address="0x00009888" value="0x01869100" />
+        <register type="NOA" address="0x00009888" value="0x0F870065" />
+        <register type="NOA" address="0x00009888" value="0x01870000" />
+        <register type="NOA" address="0x00009888" value="0x19930800" />
+        <register type="NOA" address="0x00009888" value="0x0B938000" />
+        <register type="NOA" address="0x00009888" value="0x0D938000" />
+        <register type="NOA" address="0x00009888" value="0x1B952000" />
+        <register type="NOA" address="0x00009888" value="0x1D955055" />
+        <register type="NOA" address="0x00009888" value="0x1F951455" />
+        <register type="NOA" address="0x00009888" value="0x0992A000" />
+        <register type="NOA" address="0x00009888" value="0x0F928000" />
+        <register type="NOA" address="0x00009888" value="0x1192A800" />
+        <register type="NOA" address="0x00009888" value="0x1392028A" />
+        <register type="NOA" address="0x00009888" value="0x0B92A000" />
+        <register type="NOA" address="0x00009888" value="0x0D922000" />
+        <register type="NOA" address="0x00009888" value="0x13908000" />
+        <register type="NOA" address="0x00009888" value="0x21908000" />
+        <register type="NOA" address="0x00009888" value="0x23908000" />
+        <register type="NOA" address="0x00009888" value="0x25908000" />
+        <register type="NOA" address="0x00009888" value="0x27908000" />
+        <register type="NOA" address="0x00009888" value="0x29908000" />
+        <register type="NOA" address="0x00009888" value="0x2B908000" />
+        <register type="NOA" address="0x00009888" value="0x2D904000" />
+        <register type="NOA" address="0x00009888" value="0x2F908000" />
+        <register type="NOA" address="0x00009888" value="0x31908000" />
+        <register type="NOA" address="0x00009888" value="0x15908000" />
+        <register type="NOA" address="0x00009888" value="0x17908000" />
+        <register type="NOA" address="0x00009888" value="0x19908000" />
+        <register type="NOA" address="0x00009888" value="0x1B908000" />
+        <register type="NOA" address="0x00009888" value="0x1D904000" />
+        <register type="NOA" address="0x00009888" value="0x1F904000" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+        <register type="NOA" address="0x00009888" value="0x43900C01" />
+        <register type="NOA" address="0x00009888" value="0x55900000" />
+        <register type="NOA" address="0x00009888" value="0x47900000" />
+        <register type="NOA" address="0x00009888" value="0x57900000" />
+        <register type="NOA" address="0x00009888" value="0x49900863" />
+        <register type="NOA" address="0x00009888" value="0x59900000" />
+        <register type="NOA" address="0x00009888" value="0x4B900061" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+        <register type="NOA" address="0x00009888" value="0x4D900000" />
+        <register type="NOA" address="0x00009888" value="0x45900C22" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002724" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002770" value="0x0007FFEA" />
+        <register type="OA" address="0x00002774" value="0x00007FFC" />
+        <register type="OA" address="0x00002778" value="0x0007AFFA" />
+        <register type="OA" address="0x0000277C" value="0x0000F5FD" />
+        <register type="OA" address="0x00002780" value="0x00079FFA" />
+        <register type="OA" address="0x00002784" value="0x0000F3FB" />
+        <register type="OA" address="0x00002788" value="0x0007BF7A" />
+        <register type="OA" address="0x0000278C" value="0x0000F7E7" />
+        <register type="OA" address="0x00002790" value="0x0007FEFA" />
+        <register type="OA" address="0x00002794" value="0x0000F7CF" />
+        <register type="OA" address="0x00002798" value="0x00077FFA" />
+        <register type="OA" address="0x0000279C" value="0x0000EFDF" />
+        <register type="OA" address="0x000027A0" value="0x0006FFFA" />
+        <register type="OA" address="0x000027A4" value="0x0000CFBF" />
+        <register type="OA" address="0x000027A8" value="0x0003FFFA" />
+        <register type="OA" address="0x000027AC" value="0x00005F7F" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00015014" />
+        <register type="FLEX" address="0x0000E658" value="0x00025024" />
+        <register type="FLEX" address="0x0000E758" value="0x00035034" />
+        <register type="FLEX" address="0x0000E45C" value="0x00045044" />
+        <register type="FLEX" address="0x0000E55C" value="0x00055054" />
+        <register type="FLEX" address="0x0000E65C" value="0x00065064" />
+    </register_config>
+  </set>
+
+  <set name="Memory Reads Distribution Gen9"
+       mdapi_supported_apis="VK OGL OCL IO BB"
+       underscore_name="memory_reads"
+       hw_config_guid="1a356946-5428-450b-a2f0-89f8783a302d"
+       chipset="GLK"
+       symbol_name="MemoryReads"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GtiL3Bank0Reads"
+             description="The total number of GTI memory reads from L3 Bank 0 (L3 Cache misses)."
+             data_type="uint64"
+             equation="C 4 READ"
+             underscore_name="gti_l3_bank0_reads"
+             units="messages"
+             symbol_name="GtiL3Bank0Reads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/L3"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="GtiRingAccesses"
+             description="The total number of all accesses from GTI to the ring."
+             data_type="uint64"
+             equation="C 3 READ 2 UMUL"
+             underscore_name="gti_ring_accesses"
+             units="messages"
+             symbol_name="GtiRingAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="GtiL3Bank3Reads"
+             description="The total number of GTI memory reads from L3 Bank 3 (L3 Cache misses)."
+             data_type="uint64"
+             equation="C 7 READ"
+             underscore_name="gti_l3_bank3_reads"
+             units="messages"
+             symbol_name="GtiL3Bank3Reads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="GTI/L3"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="GtiRsMemoryReads"
+             description="The total number of GTI memory reads from Resource Streamer."
+             data_type="uint64"
+             equation="B 2 READ"
+             underscore_name="gti_rs_memory_reads"
+             units="messages"
+             symbol_name="GtiRsMemoryReads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/3D Pipe/Resource Streamer"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GtiHizMemoryReads"
+             description="The total number of GTI memory reads from Hierarchical Depth Cache (Hi-Depth Cache misses)."
+             data_type="uint64"
+             equation="B 5 READ"
+             underscore_name="gti_hiz_memory_reads"
+             units="messages"
+             symbol_name="GtiHizMemoryReads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Depth Cache"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texel lookups (with 2x2 accuracy) that missed the L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="GtiRccMemoryReads"
+             description="The total number of GTI memory reads from Render Color Cache (Render Color Cache misses)."
+             data_type="uint64"
+             equation="B 3 READ"
+             underscore_name="gti_rcc_memory_reads"
+             units="messages"
+             symbol_name="GtiRccMemoryReads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Color Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GtiL3Bank1Reads"
+             description="The total number of GTI memory reads from L3 Bank 1 (L3 Cache misses)."
+             data_type="uint64"
+             equation="C 5 READ"
+             underscore_name="gti_l3_bank1_reads"
+             units="messages"
+             symbol_name="GtiL3Bank1Reads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="GTI/L3"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GtiCmdStreamerMemoryReads"
+             description="The total number of GTI memory reads from Command Streamer."
+             data_type="uint64"
+             equation="B 0 READ"
+             underscore_name="gti_cmd_streamer_memory_reads"
+             units="messages"
+             symbol_name="GtiCmdStreamerMemoryReads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/3D Pipe/Command Streamer"
+             />
+    <counter name="GtiL3Bank2Reads"
+             description="The total number of GTI memory reads from L3 Bank 2 (L3 Cache misses)."
+             data_type="uint64"
+             equation="C 6 READ"
+             underscore_name="gti_l3_bank2_reads"
+             units="messages"
+             symbol_name="GtiL3Bank2Reads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="GTI/L3"
+             />
+    <counter name="GtiMemoryReads"
+             description="The total number of GTI memory reads."
+             data_type="uint64"
+             equation="C 0 READ"
+             underscore_name="gti_memory_reads"
+             units="messages"
+             symbol_name="GtiMemoryReads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="GtiRczMemoryReads"
+             description="The total number of GTI memory reads from Render Depth Cache (Render Depth Cache misses)."
+             data_type="uint64"
+             equation="B 7 READ"
+             underscore_name="gti_rcz_memory_reads"
+             units="messages"
+             symbol_name="GtiRczMemoryReads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Depth Cache"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="GtiMscMemoryReads"
+             description="The total number of GTI memory reads from Multisampling Color Cache (Multisampling Color Cache misses)."
+             data_type="uint64"
+             equation="B 4 READ"
+             underscore_name="gti_msc_memory_reads"
+             units="messages"
+             symbol_name="GtiMscMemoryReads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Color Cache"
+             />
+    <counter name="GtiVfMemoryReads"
+             description="The total number of GTI memory reads from Vertex Fetch."
+             data_type="uint64"
+             equation="B 1 READ"
+             underscore_name="gti_vf_memory_reads"
+             units="messages"
+             symbol_name="GtiVfMemoryReads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/3D Pipe/Vertex Fetch"
+             />
+    <counter name="GtiStcMemoryReads"
+             description="The total number of GTI memory reads from Stencil Cache (Stencil Cache misses)."
+             data_type="uint64"
+             equation="B 6 READ"
+             underscore_name="gti_stc_memory_reads"
+             units="messages"
+             symbol_name="GtiStcMemoryReads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Depth Cache"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GtiL3Reads"
+             description="The total number of GTI memory reads from L3 (L3 Cache misses)."
+             data_type="uint64"
+             equation="$GtiL3Bank0Reads $GtiL3Bank1Reads $GtiL3Bank2Reads $GtiL3Bank3Reads UADD UADD UADD"
+             underscore_name="gti_l3_reads"
+             units="messages"
+             symbol_name="GtiL3Reads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/L3"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x19800343" />
+        <register type="NOA" address="0x00009888" value="0x39900340" />
+        <register type="NOA" address="0x00009888" value="0x3F901000" />
+        <register type="NOA" address="0x00009888" value="0x41900003" />
+        <register type="NOA" address="0x00009888" value="0x03803180" />
+        <register type="NOA" address="0x00009888" value="0x058035E2" />
+        <register type="NOA" address="0x00009888" value="0x0780006A" />
+        <register type="NOA" address="0x00009888" value="0x11800000" />
+        <register type="NOA" address="0x00009888" value="0x2181A000" />
+        <register type="NOA" address="0x00009888" value="0x2381000A" />
+        <register type="NOA" address="0x00009888" value="0x1D950550" />
+        <register type="NOA" address="0x00009888" value="0x0B928000" />
+        <register type="NOA" address="0x00009888" value="0x0D92A000" />
+        <register type="NOA" address="0x00009888" value="0x0F922000" />
+        <register type="NOA" address="0x00009888" value="0x13900170" />
+        <register type="NOA" address="0x00009888" value="0x21900171" />
+        <register type="NOA" address="0x00009888" value="0x23900172" />
+        <register type="NOA" address="0x00009888" value="0x25900173" />
+        <register type="NOA" address="0x00009888" value="0x27900174" />
+        <register type="NOA" address="0x00009888" value="0x29900175" />
+        <register type="NOA" address="0x00009888" value="0x2B900176" />
+        <register type="NOA" address="0x00009888" value="0x2D900177" />
+        <register type="NOA" address="0x00009888" value="0x2F90017F" />
+        <register type="NOA" address="0x00009888" value="0x31900125" />
+        <register type="NOA" address="0x00009888" value="0x15900123" />
+        <register type="NOA" address="0x00009888" value="0x17900121" />
+        <register type="NOA" address="0x00009888" value="0x35900000" />
+        <register type="NOA" address="0x00009888" value="0x19908000" />
+        <register type="NOA" address="0x00009888" value="0x1B908000" />
+        <register type="NOA" address="0x00009888" value="0x1D908000" />
+        <register type="NOA" address="0x00009888" value="0x1F908000" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+        <register type="NOA" address="0x00009888" value="0x43901084" />
+        <register type="NOA" address="0x00009888" value="0x55900000" />
+        <register type="NOA" address="0x00009888" value="0x47901080" />
+        <register type="NOA" address="0x00009888" value="0x57900000" />
+        <register type="NOA" address="0x00009888" value="0x49901084" />
+        <register type="NOA" address="0x00009888" value="0x59900000" />
+        <register type="NOA" address="0x00009888" value="0x4B901084" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+        <register type="NOA" address="0x00009888" value="0x4D900004" />
+        <register type="NOA" address="0x00009888" value="0x45900000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x0000272C" value="0xFFFFFFFF" />
+        <register type="OA" address="0x00002728" value="0xFFFFFFFF" />
+        <register type="OA" address="0x00002724" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x0000271C" value="0xFFFFFFFF" />
+        <register type="OA" address="0x00002718" value="0xFFFFFFFF" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x0000274C" value="0x86543210" />
+        <register type="OA" address="0x00002748" value="0x86543210" />
+        <register type="OA" address="0x00002744" value="0x00006667" />
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x0000275C" value="0x86543210" />
+        <register type="OA" address="0x00002758" value="0x86543210" />
+        <register type="OA" address="0x00002754" value="0x00006465" />
+        <register type="OA" address="0x00002750" value="0x00000000" />
+        <register type="OA" address="0x00002770" value="0x0007F81A" />
+        <register type="OA" address="0x00002774" value="0x0000FE00" />
+        <register type="OA" address="0x00002778" value="0x0007F82A" />
+        <register type="OA" address="0x0000277C" value="0x0000FE00" />
+        <register type="OA" address="0x00002780" value="0x0007F872" />
+        <register type="OA" address="0x00002784" value="0x0000FE00" />
+        <register type="OA" address="0x00002788" value="0x0007F8BA" />
+        <register type="OA" address="0x0000278C" value="0x0000FE00" />
+        <register type="OA" address="0x00002790" value="0x0007F87A" />
+        <register type="OA" address="0x00002794" value="0x0000FE00" />
+        <register type="OA" address="0x00002798" value="0x0007F8EA" />
+        <register type="OA" address="0x0000279C" value="0x0000FE00" />
+        <register type="OA" address="0x000027A0" value="0x0007F8E2" />
+        <register type="OA" address="0x000027A4" value="0x0000FE00" />
+        <register type="OA" address="0x000027A8" value="0x0007F8F2" />
+        <register type="OA" address="0x000027AC" value="0x0000FE00" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00015014" />
+        <register type="FLEX" address="0x0000E658" value="0x00025024" />
+        <register type="FLEX" address="0x0000E758" value="0x00035034" />
+        <register type="FLEX" address="0x0000E45C" value="0x00045044" />
+        <register type="FLEX" address="0x0000E55C" value="0x00055054" />
+        <register type="FLEX" address="0x0000E65C" value="0x00065064" />
+    </register_config>
+  </set>
+
+  <set name="Memory Writes Distribution Gen9"
+       mdapi_supported_apis="VK OGL OCL IO BB"
+       underscore_name="memory_writes"
+       hw_config_guid="5299be9d-7a61-4c99-9f81-f87e6c5aaca9"
+       chipset="GLK"
+       symbol_name="MemoryWrites"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GtiMemoryWrites"
+             description="The total number of GTI memory writes."
+             data_type="uint64"
+             equation="C 0 READ"
+             underscore_name="gti_memory_writes"
+             units="messages"
+             symbol_name="GtiMemoryWrites"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="GtiRingAccesses"
+             description="The total number of all GTI accesses to the ring."
+             data_type="uint64"
+             equation="C 3 READ 2 UMUL"
+             underscore_name="gti_ring_accesses"
+             units="messages"
+             symbol_name="GtiRingAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="GtiMscMemoryWrites"
+             description="The total number of GTI memory writes from Multisampling Color Cache (Multisampling Color Cache invalidations)."
+             data_type="uint64"
+             equation="B 4 READ"
+             underscore_name="gti_msc_memory_writes"
+             units="messages"
+             symbol_name="GtiMscMemoryWrites"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Color Cache"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="GtiCmdStreamerMemoryWrites"
+             description="The total number of GTI memory writes from Command Streamer."
+             data_type="uint64"
+             equation="B 0 READ"
+             underscore_name="gti_cmd_streamer_memory_writes"
+             units="messages"
+             symbol_name="GtiCmdStreamerMemoryWrites"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/3D Pipe/Command Streamer"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GtiL3Bank0Writes"
+             description="The total number of GTI memory writes from L3 Bank 0 (L3 Bank 0 invalidations)."
+             data_type="uint64"
+             equation="C 4 READ"
+             underscore_name="gti_l3_bank0_writes"
+             units="messages"
+             symbol_name="GtiL3Bank0Writes"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/L3"
+             />
+    <counter name="GtiL3Bank1Writes"
+             description="The total number of GTI memory writes from L3 Bank 1 (L3 Bank 1 invalidations)."
+             data_type="uint64"
+             equation="C 5 READ"
+             underscore_name="gti_l3_bank1_writes"
+             units="messages"
+             symbol_name="GtiL3Bank1Writes"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/L3"
+             />
+    <counter name="GtiL3Bank2Writes"
+             description="The total number of GTI memory writes from L3 Bank 2 (L3 Bank 2 invalidations)."
+             data_type="uint64"
+             equation="C 6 READ"
+             underscore_name="gti_l3_bank2_writes"
+             units="messages"
+             symbol_name="GtiL3Bank2Writes"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/L3"
+             />
+    <counter name="GtiL3Bank3Writes"
+             description="The total number of GTI memory writes from L3 Bank 3 (L3 Bank 3 invalidations)."
+             data_type="uint64"
+             equation="C 7 READ"
+             underscore_name="gti_l3_bank3_writes"
+             units="messages"
+             symbol_name="GtiL3Bank3Writes"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/L3"
+             />
+    <counter name="GtiL3Writes"
+             description="The total number of GTI memory writes from L3 (L3 invalidations)."
+             data_type="uint64"
+             equation="$GtiL3Bank0Writes $GtiL3Bank1Writes $GtiL3Bank2Writes $GtiL3Bank3Writes UADD UADD UADD"
+             underscore_name="gti_l3_writes"
+             units="messages"
+             symbol_name="GtiL3Writes"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/L3"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GtiRccMemoryWrites"
+             description="The total number of GTI memory writes from Render Color Cache (Render Color Cache invalidations)."
+             data_type="uint64"
+             equation="B 3 READ"
+             underscore_name="gti_rcc_memory_writes"
+             units="messages"
+             symbol_name="GtiRccMemoryWrites"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Color Cache"
+             />
+    <counter name="GtiSoMemoryWrites"
+             description="The total number of GTI memory writes from Stream Output."
+             data_type="uint64"
+             equation="B 2 READ"
+             underscore_name="gti_so_memory_writes"
+             units="messages"
+             symbol_name="GtiSoMemoryWrites"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/3D Pipe/Stream Output"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GtiStcMemoryWrites"
+             description="The total number of GTI memory writes from Stencil Cache."
+             data_type="uint64"
+             equation="B 6 READ"
+             underscore_name="gti_stc_memory_writes"
+             units="messages"
+             symbol_name="GtiStcMemoryWrites"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Depth Cache"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="GtiRczMemoryWrites"
+             description="The total number of GTI memory writes from Render Depth Cache."
+             data_type="uint64"
+             equation="B 7 READ"
+             underscore_name="gti_rcz_memory_writes"
+             units="messages"
+             symbol_name="GtiRczMemoryWrites"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Depth Cache"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="GtiHizMemoryWrites"
+             description="The total number of GTI memory writes from Hierarchical Depth Cache."
+             data_type="uint64"
+             equation="B 5 READ"
+             underscore_name="gti_hiz_memory_writes"
+             units="messages"
+             symbol_name="GtiHizMemoryWrites"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Depth Cache"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x19800343" />
+        <register type="NOA" address="0x00009888" value="0x39900340" />
+        <register type="NOA" address="0x00009888" value="0x3F900000" />
+        <register type="NOA" address="0x00009888" value="0x41900080" />
+        <register type="NOA" address="0x00009888" value="0x03803180" />
+        <register type="NOA" address="0x00009888" value="0x058035E2" />
+        <register type="NOA" address="0x00009888" value="0x0780006A" />
+        <register type="NOA" address="0x00009888" value="0x11800000" />
+        <register type="NOA" address="0x00009888" value="0x2181A000" />
+        <register type="NOA" address="0x00009888" value="0x2381000A" />
+        <register type="NOA" address="0x00009888" value="0x1D950550" />
+        <register type="NOA" address="0x00009888" value="0x0B928000" />
+        <register type="NOA" address="0x00009888" value="0x0D92A000" />
+        <register type="NOA" address="0x00009888" value="0x0F922000" />
+        <register type="NOA" address="0x00009888" value="0x13900180" />
+        <register type="NOA" address="0x00009888" value="0x21900181" />
+        <register type="NOA" address="0x00009888" value="0x23900182" />
+        <register type="NOA" address="0x00009888" value="0x25900183" />
+        <register type="NOA" address="0x00009888" value="0x27900184" />
+        <register type="NOA" address="0x00009888" value="0x29900185" />
+        <register type="NOA" address="0x00009888" value="0x2B900186" />
+        <register type="NOA" address="0x00009888" value="0x2D900187" />
+        <register type="NOA" address="0x00009888" value="0x2F900170" />
+        <register type="NOA" address="0x00009888" value="0x31900125" />
+        <register type="NOA" address="0x00009888" value="0x15900123" />
+        <register type="NOA" address="0x00009888" value="0x17900121" />
+        <register type="NOA" address="0x00009888" value="0x35900000" />
+        <register type="NOA" address="0x00009888" value="0x19908000" />
+        <register type="NOA" address="0x00009888" value="0x1B908000" />
+        <register type="NOA" address="0x00009888" value="0x1D908000" />
+        <register type="NOA" address="0x00009888" value="0x1F908000" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+        <register type="NOA" address="0x00009888" value="0x43901084" />
+        <register type="NOA" address="0x00009888" value="0x55900000" />
+        <register type="NOA" address="0x00009888" value="0x47901080" />
+        <register type="NOA" address="0x00009888" value="0x57900000" />
+        <register type="NOA" address="0x00009888" value="0x49901084" />
+        <register type="NOA" address="0x00009888" value="0x59900000" />
+        <register type="NOA" address="0x00009888" value="0x4B901084" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+        <register type="NOA" address="0x00009888" value="0x4D900004" />
+        <register type="NOA" address="0x00009888" value="0x45900000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x0000272C" value="0xFFFFFFFF" />
+        <register type="OA" address="0x00002728" value="0xFFFFFFFF" />
+        <register type="OA" address="0x00002724" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x0000271C" value="0xFFFFFFFF" />
+        <register type="OA" address="0x00002718" value="0xFFFFFFFF" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x0000274C" value="0x86543210" />
+        <register type="OA" address="0x00002748" value="0x86543210" />
+        <register type="OA" address="0x00002744" value="0x00006667" />
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x0000275C" value="0x86543210" />
+        <register type="OA" address="0x00002758" value="0x86543210" />
+        <register type="OA" address="0x00002754" value="0x00006465" />
+        <register type="OA" address="0x00002750" value="0x00000000" />
+        <register type="OA" address="0x00002770" value="0x0007F81A" />
+        <register type="OA" address="0x00002774" value="0x0000FE00" />
+        <register type="OA" address="0x00002778" value="0x0007F82A" />
+        <register type="OA" address="0x0000277C" value="0x0000FE00" />
+        <register type="OA" address="0x00002780" value="0x0007F822" />
+        <register type="OA" address="0x00002784" value="0x0000FE00" />
+        <register type="OA" address="0x00002788" value="0x0007F8BA" />
+        <register type="OA" address="0x0000278C" value="0x0000FE00" />
+        <register type="OA" address="0x00002790" value="0x0007F87A" />
+        <register type="OA" address="0x00002794" value="0x0000FE00" />
+        <register type="OA" address="0x00002798" value="0x0007F8EA" />
+        <register type="OA" address="0x0000279C" value="0x0000FE00" />
+        <register type="OA" address="0x000027A0" value="0x0007F8E2" />
+        <register type="OA" address="0x000027A4" value="0x0000FE00" />
+        <register type="OA" address="0x000027A8" value="0x0007F8F2" />
+        <register type="OA" address="0x000027AC" value="0x0000FE00" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00015014" />
+        <register type="FLEX" address="0x0000E658" value="0x00025024" />
+        <register type="FLEX" address="0x0000E758" value="0x00035034" />
+        <register type="FLEX" address="0x0000E45C" value="0x00045044" />
+        <register type="FLEX" address="0x0000E55C" value="0x00055054" />
+        <register type="FLEX" address="0x0000E65C" value="0x00065064" />
+    </register_config>
+  </set>
+
+  <set name="Compute Metrics Extended Gen9"
+       mdapi_supported_apis="VK OGL4 OCL IO BB"
+       underscore_name="compute_extended"
+       hw_config_guid="bc9bcff2-459a-4cbc-986d-a84b077153f3"
+       chipset="GLK"
+       symbol_name="ComputeExtended"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="fpu0_active"
+             units="percent"
+             symbol_name="Fpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="fpu1_active"
+             units="percent"
+             symbol_name="Fpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU AVG IPC Rate"
+             description="The average rate of IPC calculated for 2 FPU pipelines."
+             data_type="float"
+             max_equation="2"
+             equation="A 9 READ  A 10 READ  A 11 READ UADD  A 9 READ USUB FDIV 1 FADD"
+             underscore_name="eu_avg_ipc_rate"
+             units="number"
+             symbol_name="EuAvgIpcRate"
+             semantic_type="ratio"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Typed Writes 0"
+             description="The subslice 0 typed writes."
+             data_type="uint64"
+             equation="C 0 READ"
+             underscore_name="typed_writes0"
+             units="messages"
+             symbol_name="TypedWrites0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="EuTypedAtomics0"
+             description="The subslice 0 EU typed atomics."
+             data_type="uint64"
+             equation="B 5 READ"
+             underscore_name="eu_typed_atomics0"
+             units="messages"
+             symbol_name="EuTypedAtomics0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="Typed Atomics 0"
+             description="The subslice 0 typed atomics."
+             data_type="uint64"
+             equation="C 4 READ"
+             underscore_name="typed_atomics0"
+             units="messages"
+             symbol_name="TypedAtomics0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="TypedAtomicsPerCacheLine"
+             description="The ratio of EU typed atomics requests to L3 cache line writes."
+             data_type="float"
+             equation="$EuTypedAtomics0 $TypedAtomics0 FDIV"
+             underscore_name="typed_atomics_per_cache_line"
+             units="eu sends to l3 cache lines"
+             symbol_name="TypedAtomicsPerCacheLine"
+             semantic_type="ratio"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="EuUntypedReads0"
+             description="The subslice 0 EU untyped reads."
+             data_type="uint64"
+             equation="B 0 READ"
+             underscore_name="eu_untyped_reads0"
+             units="messages"
+             symbol_name="EuUntypedReads0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="Untyped Writes 0"
+             description="The subslice 0 untyped writes (including SLM writes)."
+             data_type="uint64"
+             equation="C 1 READ"
+             underscore_name="untyped_writes0"
+             units="messages"
+             symbol_name="UntypedWrites0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="EuUntypedAtomics0"
+             description="The subslice 0 EU untyped atomics."
+             data_type="uint64"
+             equation="B 4 READ"
+             underscore_name="eu_untyped_atomics0"
+             units="messages"
+             symbol_name="EuUntypedAtomics0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="EuUntypedWrites0"
+             description="The subslice 0 EU untyped writes."
+             data_type="uint64"
+             equation="B 1 READ"
+             underscore_name="eu_untyped_writes0"
+             units="messages"
+             symbol_name="EuUntypedWrites0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="EuA64UntypedWrites0"
+             description="The subslice 0 EU A64 untyped writes."
+             data_type="uint64"
+             equation="B 7 READ"
+             underscore_name="eu_a64_untyped_writes0"
+             units="messages"
+             symbol_name="EuA64UntypedWrites0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="UntypedWritesPerCacheLine"
+             description="The ratio of EU untyped write requests to L3 cache line writes."
+             data_type="float"
+             equation="$EuUntypedWrites0 $EuA64UntypedWrites0 UADD $UntypedWrites0 FDIV"
+             underscore_name="untyped_writes_per_cache_line"
+             units="eu sends to l3 cache lines"
+             symbol_name="UntypedWritesPerCacheLine"
+             semantic_type="ratio"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texel lookups (with 2x2 accuracy) that missed the L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EuTypedWrites0"
+             description="The subslice 0 EU typed writes."
+             data_type="uint64"
+             equation="B 3 READ"
+             underscore_name="eu_typed_writes0"
+             units="messages"
+             symbol_name="EuTypedWrites0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="TypedWritesPerCacheLine"
+             description="The ratio of EU typed write requests to L3 cache line writes."
+             data_type="float"
+             equation="$EuTypedWrites0 $TypedWrites0 FDIV"
+             underscore_name="typed_writes_per_cache_line"
+             units="eu sends to l3 cache lines"
+             symbol_name="TypedWritesPerCacheLine"
+             semantic_type="ratio"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="Typed Reads 0"
+             description="The subslice 0 typed reads."
+             data_type="uint64"
+             equation="C 2 READ"
+             underscore_name="typed_reads0"
+             units="messages"
+             symbol_name="TypedReads0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="Untyped Reads 0"
+             description="The subslice 0 untyped reads (including SLM reads)."
+             data_type="uint64"
+             equation="C 3 READ"
+             underscore_name="untyped_reads0"
+             units="messages"
+             symbol_name="UntypedReads0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="EuA64UntypedReads0"
+             description="The subslice 0 EU A64 untyped reads."
+             data_type="uint64"
+             equation="B 6 READ"
+             underscore_name="eu_a64_untyped_reads0"
+             units="messages"
+             symbol_name="EuA64UntypedReads0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="EU Thread Occupancy"
+             description="The percentage of time in which hardware threads occupied EUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 13 READ 8 UMUL $EuCoresTotalCount UDIV $EuThreadsCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_thread_occupancy"
+             units="percent"
+             symbol_name="EuThreadOccupancy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EuTypedReads0"
+             description="The subslice 0 EU typed reads."
+             data_type="uint64"
+             equation="B 2 READ"
+             underscore_name="eu_typed_reads0"
+             units="messages"
+             symbol_name="EuTypedReads0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="UntypedReadsPerCacheLine"
+             description="The ratio of EU untyped read requests to L3 cache line reads."
+             data_type="float"
+             equation="$EuUntypedReads0 $EuA64UntypedReads0 UADD $UntypedReads0 FDIV"
+             underscore_name="untyped_reads_per_cache_line"
+             units="eu sends to l3 cache lines"
+             symbol_name="UntypedReadsPerCacheLine"
+             semantic_type="ratio"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="TypedReadsPerCacheLine"
+             description="The ratio of EU typed read requests to L3 cache line reads."
+             data_type="float"
+             equation="$EuTypedReads0 $TypedReads0 FDIV"
+             underscore_name="typed_reads_per_cache_line"
+             units="eu sends to l3 cache lines"
+             symbol_name="TypedReadsPerCacheLine"
+             semantic_type="ratio"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <counter name="EU Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_send_active"
+             units="percent"
+             symbol_name="EuSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x104F00E0" />
+        <register type="NOA" address="0x00009888" value="0x141C0160" />
+        <register type="NOA" address="0x00009888" value="0x161C0015" />
+        <register type="NOA" address="0x00009888" value="0x181C0120" />
+        <register type="NOA" address="0x00009888" value="0x002D5000" />
+        <register type="NOA" address="0x00009888" value="0x062D4000" />
+        <register type="NOA" address="0x00009888" value="0x082D5000" />
+        <register type="NOA" address="0x00009888" value="0x0A2D5000" />
+        <register type="NOA" address="0x00009888" value="0x0C2D5000" />
+        <register type="NOA" address="0x00009888" value="0x0E2D5000" />
+        <register type="NOA" address="0x00009888" value="0x022D5000" />
+        <register type="NOA" address="0x00009888" value="0x042D5000" />
+        <register type="NOA" address="0x00009888" value="0x0C2E5400" />
+        <register type="NOA" address="0x00009888" value="0x0E2E5515" />
+        <register type="NOA" address="0x00009888" value="0x102E0155" />
+        <register type="NOA" address="0x00009888" value="0x044CC000" />
+        <register type="NOA" address="0x00009888" value="0x0A4C8000" />
+        <register type="NOA" address="0x00009888" value="0x0C4CC000" />
+        <register type="NOA" address="0x00009888" value="0x0E4CC000" />
+        <register type="NOA" address="0x00009888" value="0x104C8000" />
+        <register type="NOA" address="0x00009888" value="0x124C8000" />
+        <register type="NOA" address="0x00009888" value="0x144C8000" />
+        <register type="NOA" address="0x00009888" value="0x164C2000" />
+        <register type="NOA" address="0x00009888" value="0x064CC000" />
+        <register type="NOA" address="0x00009888" value="0x084CC000" />
+        <register type="NOA" address="0x00009888" value="0x004EA000" />
+        <register type="NOA" address="0x00009888" value="0x064E8000" />
+        <register type="NOA" address="0x00009888" value="0x084EA000" />
+        <register type="NOA" address="0x00009888" value="0x0A4EA000" />
+        <register type="NOA" address="0x00009888" value="0x0C4EA000" />
+        <register type="NOA" address="0x00009888" value="0x0E4EA000" />
+        <register type="NOA" address="0x00009888" value="0x024EA000" />
+        <register type="NOA" address="0x00009888" value="0x044EA000" />
+        <register type="NOA" address="0x00009888" value="0x0E4F4B41" />
+        <register type="NOA" address="0x00009888" value="0x004F4200" />
+        <register type="NOA" address="0x00009888" value="0x024F404C" />
+        <register type="NOA" address="0x00009888" value="0x1C4F0000" />
+        <register type="NOA" address="0x00009888" value="0x1A4F0000" />
+        <register type="NOA" address="0x00009888" value="0x001B4000" />
+        <register type="NOA" address="0x00009888" value="0x061B8000" />
+        <register type="NOA" address="0x00009888" value="0x081BC000" />
+        <register type="NOA" address="0x00009888" value="0x0A1BC000" />
+        <register type="NOA" address="0x00009888" value="0x0C1BC000" />
+        <register type="NOA" address="0x00009888" value="0x041BC000" />
+        <register type="NOA" address="0x00009888" value="0x001C0031" />
+        <register type="NOA" address="0x00009888" value="0x061C1900" />
+        <register type="NOA" address="0x00009888" value="0x081C1A33" />
+        <register type="NOA" address="0x00009888" value="0x0A1C1B35" />
+        <register type="NOA" address="0x00009888" value="0x0C1C3337" />
+        <register type="NOA" address="0x00009888" value="0x041C31C7" />
+        <register type="NOA" address="0x00009888" value="0x180F5000" />
+        <register type="NOA" address="0x00009888" value="0x1A0FA8AA" />
+        <register type="NOA" address="0x00009888" value="0x1C0F0AAA" />
+        <register type="NOA" address="0x00009888" value="0x182C8000" />
+        <register type="NOA" address="0x00009888" value="0x1C2C6AAA" />
+        <register type="NOA" address="0x00009888" value="0x1E2C0001" />
+        <register type="NOA" address="0x00009888" value="0x1A2C2950" />
+        <register type="NOA" address="0x00009888" value="0x01938000" />
+        <register type="NOA" address="0x00009888" value="0x0F938000" />
+        <register type="NOA" address="0x00009888" value="0x1993AAAA" />
+        <register type="NOA" address="0x00009888" value="0x03938000" />
+        <register type="NOA" address="0x00009888" value="0x05938000" />
+        <register type="NOA" address="0x00009888" value="0x07938000" />
+        <register type="NOA" address="0x00009888" value="0x09938000" />
+        <register type="NOA" address="0x00009888" value="0x0B938000" />
+        <register type="NOA" address="0x00009888" value="0x13904000" />
+        <register type="NOA" address="0x00009888" value="0x21904000" />
+        <register type="NOA" address="0x00009888" value="0x23904000" />
+        <register type="NOA" address="0x00009888" value="0x25904000" />
+        <register type="NOA" address="0x00009888" value="0x27904000" />
+        <register type="NOA" address="0x00009888" value="0x29904000" />
+        <register type="NOA" address="0x00009888" value="0x2B904000" />
+        <register type="NOA" address="0x00009888" value="0x2D904000" />
+        <register type="NOA" address="0x00009888" value="0x2F904000" />
+        <register type="NOA" address="0x00009888" value="0x31904000" />
+        <register type="NOA" address="0x00009888" value="0x15904000" />
+        <register type="NOA" address="0x00009888" value="0x17904000" />
+        <register type="NOA" address="0x00009888" value="0x19904000" />
+        <register type="NOA" address="0x00009888" value="0x1B904000" />
+        <register type="NOA" address="0x00009888" value="0x1D904000" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+        <register type="NOA" address="0x00009888" value="0x43900420" />
+        <register type="NOA" address="0x00009888" value="0x55900000" />
+        <register type="NOA" address="0x00009888" value="0x47900000" />
+        <register type="NOA" address="0x00009888" value="0x57900000" />
+        <register type="NOA" address="0x00009888" value="0x49900000" />
+        <register type="NOA" address="0x00009888" value="0x59900000" />
+        <register type="NOA" address="0x00009888" value="0x4B900400" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+        <register type="NOA" address="0x00009888" value="0x4D900001" />
+        <register type="NOA" address="0x00009888" value="0x45900001" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002724" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002770" value="0x0007FC2A" />
+        <register type="OA" address="0x00002774" value="0x0000BF00" />
+        <register type="OA" address="0x00002778" value="0x0007FC6A" />
+        <register type="OA" address="0x0000277C" value="0x0000BF00" />
+        <register type="OA" address="0x00002780" value="0x0007FC92" />
+        <register type="OA" address="0x00002784" value="0x0000BF00" />
+        <register type="OA" address="0x00002788" value="0x0007FCA2" />
+        <register type="OA" address="0x0000278C" value="0x0000BF00" />
+        <register type="OA" address="0x00002790" value="0x0007FC32" />
+        <register type="OA" address="0x00002794" value="0x0000BF00" />
+        <register type="OA" address="0x00002798" value="0x0007FC9A" />
+        <register type="OA" address="0x0000279C" value="0x0000BF00" />
+        <register type="OA" address="0x000027A0" value="0x0007FE6A" />
+        <register type="OA" address="0x000027A4" value="0x0000BF00" />
+        <register type="OA" address="0x000027A8" value="0x0007FE7A" />
+        <register type="OA" address="0x000027AC" value="0x0000BF00" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00000003" />
+        <register type="FLEX" address="0x0000E658" value="0x00002001" />
+        <register type="FLEX" address="0x0000E758" value="0x00778008" />
+        <register type="FLEX" address="0x0000E45C" value="0x00088078" />
+        <register type="FLEX" address="0x0000E55C" value="0x00808708" />
+        <register type="FLEX" address="0x0000E65C" value="0x00A08908" />
+    </register_config>
+  </set>
+
+  <set name="Compute Metrics L3 Cache Gen9"
+       mdapi_supported_apis="VK OGL4 OCL IO BB"
+       underscore_name="compute_l3_cache"
+       hw_config_guid="88ec931f-5b4a-453a-9db6-a61232b6143d"
+       chipset="GLK"
+       symbol_name="ComputeL3Cache"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Bank 03 Accesses"
+             description="The total number of accesses to L3 Bank 03."
+             data_type="uint64"
+             equation="B 3 READ 2 UMUL"
+             underscore_name="l3_bank03_accesses"
+             units="messages"
+             symbol_name="L3Bank03Accesses"
+             availability="$SliceMask 0x01 AND"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="slice"
+             mdapi_group="L3"
+             />
+    <counter name="L3 Accesses"
+             description="The total number of L3 accesses from all entities."
+             data_type="uint64"
+             equation="C 0 READ C 1 READ B 2 READ B 3 READ UADD UADD UADD 2 UMUL"
+             underscore_name="l3_accesses"
+             units="messages"
+             symbol_name="L3Accesses"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Sampler Throughput"
+             description="The total number of GPU memory bytes transferred between samplers and L3 caches."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="A 29 READ 64 UMUL"
+             underscore_name="l3_sampler_throughput"
+             units="bytes"
+             symbol_name="L3SamplerThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Sampler"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="fpu0_active"
+             units="percent"
+             symbol_name="Fpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="fpu1_active"
+             units="percent"
+             symbol_name="Fpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU AVG IPC Rate"
+             description="The average rate of IPC calculated for 2 FPU pipelines."
+             data_type="float"
+             max_equation="2"
+             equation="A 9 READ  A 10 READ  A 11 READ UADD  A 9 READ USUB FDIV 1 FADD"
+             underscore_name="eu_avg_ipc_rate"
+             units="number"
+             symbol_name="EuAvgIpcRate"
+             semantic_type="ratio"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier4 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU0 Binary Instruction"
+             description="The percentage of time in which execution units were actively processing binary instructions on FPU0."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_binary_fpu0_instruction"
+             units="percent"
+             symbol_name="EuBinaryFpu0Instruction"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes/Instructions"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="EU FPU0 Hybrid Instruction"
+             description="The percentage of time in which execution units were actively processing hybrid instructions on FPU0."
+             data_type="float"
+             max_equation="100"
+             equation="A 13 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_hybrid_fpu0_instruction"
+             units="percent"
+             symbol_name="EuHybridFpu0Instruction"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="EU Array/Pipes/Instructions"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Misses"
+             description="The total number of L3 misses."
+             data_type="uint64"
+             equation="C 4 READ C 5 READ UADD"
+             underscore_name="l3_misses"
+             units="messages"
+             symbol_name="L3Misses"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/TAG"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="L3 Bank 00 Accesses"
+             description="The total number of accesses to L3 Bank 00."
+             data_type="uint64"
+             equation="C 0 READ 2 UMUL"
+             underscore_name="l3_bank00_accesses"
+             units="messages"
+             symbol_name="L3Bank00Accesses"
+             availability="$SliceMask 0x01 AND"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="slice"
+             mdapi_group="L3"
+             />
+    <counter name="EU FPU0 Move Instruction"
+             description="The percentage of time in which execution units were actively processing move instructions on FPU0."
+             data_type="float"
+             max_equation="100"
+             equation="A 19 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_move_fpu0_instruction"
+             units="percent"
+             symbol_name="EuMoveFpu0Instruction"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes/Instructions"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU FPU1 Hybrid Instruction"
+             description="The percentage of time in which execution units were actively processing hybrid instructions on FPU1."
+             data_type="float"
+             max_equation="100"
+             equation="A 14 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_hybrid_fpu1_instruction"
+             units="percent"
+             symbol_name="EuHybridFpu1Instruction"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="EU Array/Pipes/Instructions"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texel lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GTI Read Throughput"
+             description="The total number of GPU memory bytes read from GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL"
+             equation="C 6 READ 64 UMUL"
+             underscore_name="gti_read_throughput"
+             units="bytes"
+             symbol_name="GtiReadThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GTI L3 Throughput"
+             description="The total number of GPU memory bytes transferred between L3 caches and GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="C 4 READ C 5 READ UADD 64 UMUL"
+             underscore_name="gti_l3_throughput"
+             units="bytes"
+             symbol_name="GtiL3Throughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Bank 00 IC Accesses"
+             description="The total number of accesses to L3 Bank 00 from IC cache."
+             data_type="uint64"
+             equation="B 0 READ B 1 READ UADD 2 UMUL $L3Bank00Accesses UMIN"
+             underscore_name="l3_bank00_ic_accesses"
+             units="messages"
+             symbol_name="L3Bank00IcAccesses"
+             availability="$SliceMask 0x01 AND"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="slice"
+             mdapi_group="L3/IC"
+             />
+    <counter name="L3 Bank 00 IC Hits"
+             description="The total number of hits in L3 Bank 00 from IC cache."
+             data_type="uint64"
+             equation="B 1 READ 2 UMUL $L3Bank00IcAccesses UMIN"
+             underscore_name="l3_bank00_ic_hits"
+             units="messages"
+             symbol_name="L3Bank00IcHits"
+             availability="$SliceMask 0x01 AND"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="slice"
+             mdapi_group="L3/IC"
+             />
+    <counter name="Sampler Accesses"
+             description="The total number of messages sent to samplers."
+             data_type="uint64"
+             equation="A 28 READ"
+             underscore_name="sampler_accesses"
+             units="messages"
+             symbol_name="SamplerAccesses"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler"
+             />
+    <counter name="L3 Bank 01 Accesses"
+             description="The total number of accesses to L3 Bank 01."
+             data_type="uint64"
+             equation="C 1 READ 2 UMUL"
+             underscore_name="l3_bank01_accesses"
+             units="messages"
+             symbol_name="L3Bank01Accesses"
+             availability="$SliceMask 0x01 AND"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="slice"
+             mdapi_group="L3"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU0 Ternary Instruction"
+             description="The percentage of time in which execution units were actively processing ternary instructions on FPU0."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_ternary_fpu0_instruction"
+             units="percent"
+             symbol_name="EuTernaryFpu0Instruction"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes/Instructions"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU FPU1 Move Instruction"
+             description="The percentage of time in which execution units were actively processing move instructions on FPU1."
+             data_type="float"
+             max_equation="100"
+             equation="A 20 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_move_fpu1_instruction"
+             units="percent"
+             symbol_name="EuMoveFpu1Instruction"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes/Instructions"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="L3 Bank 02 Accesses"
+             description="The total number of accesses to L3 Bank 02."
+             data_type="uint64"
+             equation="B 2 READ 2 UMUL"
+             underscore_name="l3_bank02_accesses"
+             units="messages"
+             symbol_name="L3Bank02Accesses"
+             availability="$SliceMask 0x01 AND"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="slice"
+             mdapi_group="L3"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="L3 Total Throughput"
+             description="The total number of GPU memory bytes transferred via L3."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="$L3Accesses 64 UMUL"
+             underscore_name="l3_total_throughput"
+             units="bytes"
+             symbol_name="L3TotalThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GTI Write Throughput"
+             description="The total number of GPU memory bytes written to GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 32 UMUL"
+             equation="C 7 READ 64 UMUL"
+             underscore_name="gti_write_throughput"
+             units="bytes"
+             symbol_name="GtiWriteThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="EU FPU1 Binary Instruction"
+             description="The percentage of time in which execution units were actively processing binary instructions on FPU1."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_binary_fpu1_instruction"
+             units="percent"
+             symbol_name="EuBinaryFpu1Instruction"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes/Instructions"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU1 Ternary Instruction"
+             description="The percentage of time in which execution units were actively processing ternary instructions on FPU1."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_ternary_fpu1_instruction"
+             units="percent"
+             symbol_name="EuTernaryFpu1Instruction"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes/Instructions"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_send_active"
+             units="percent"
+             symbol_name="EuSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x166C03B0" />
+        <register type="NOA" address="0x00009888" value="0x1593001E" />
+        <register type="NOA" address="0x00009888" value="0x3F900C00" />
+        <register type="NOA" address="0x00009888" value="0x41900000" />
+        <register type="NOA" address="0x00009888" value="0x002D1000" />
+        <register type="NOA" address="0x00009888" value="0x062D4000" />
+        <register type="NOA" address="0x00009888" value="0x082D5000" />
+        <register type="NOA" address="0x00009888" value="0x0E2D5000" />
+        <register type="NOA" address="0x00009888" value="0x0C2E0400" />
+        <register type="NOA" address="0x00009888" value="0x0E2E1500" />
+        <register type="NOA" address="0x00009888" value="0x102E0140" />
+        <register type="NOA" address="0x00009888" value="0x044C4000" />
+        <register type="NOA" address="0x00009888" value="0x0A4C8000" />
+        <register type="NOA" address="0x00009888" value="0x0C4CC000" />
+        <register type="NOA" address="0x00009888" value="0x144C8000" />
+        <register type="NOA" address="0x00009888" value="0x164C2000" />
+        <register type="NOA" address="0x00009888" value="0x004E2000" />
+        <register type="NOA" address="0x00009888" value="0x064E8000" />
+        <register type="NOA" address="0x00009888" value="0x084EA000" />
+        <register type="NOA" address="0x00009888" value="0x0E4EA000" />
+        <register type="NOA" address="0x00009888" value="0x1A4F4001" />
+        <register type="NOA" address="0x00009888" value="0x1C4F5005" />
+        <register type="NOA" address="0x00009888" value="0x006C0051" />
+        <register type="NOA" address="0x00009888" value="0x066C5000" />
+        <register type="NOA" address="0x00009888" value="0x086C5C5D" />
+        <register type="NOA" address="0x00009888" value="0x0E6C5E5F" />
+        <register type="NOA" address="0x00009888" value="0x106C0000" />
+        <register type="NOA" address="0x00009888" value="0x146C0000" />
+        <register type="NOA" address="0x00009888" value="0x1A6C0000" />
+        <register type="NOA" address="0x00009888" value="0x1C6C0000" />
+        <register type="NOA" address="0x00009888" value="0x180F1000" />
+        <register type="NOA" address="0x00009888" value="0x1A0FA800" />
+        <register type="NOA" address="0x00009888" value="0x1C0F0A00" />
+        <register type="NOA" address="0x00009888" value="0x182C4000" />
+        <register type="NOA" address="0x00009888" value="0x1C2C4015" />
+        <register type="NOA" address="0x00009888" value="0x1E2C0001" />
+        <register type="NOA" address="0x00009888" value="0x03931980" />
+        <register type="NOA" address="0x00009888" value="0x05930032" />
+        <register type="NOA" address="0x00009888" value="0x11930000" />
+        <register type="NOA" address="0x00009888" value="0x01938000" />
+        <register type="NOA" address="0x00009888" value="0x0F938000" />
+        <register type="NOA" address="0x00009888" value="0x1993A00A" />
+        <register type="NOA" address="0x00009888" value="0x07930000" />
+        <register type="NOA" address="0x00009888" value="0x09930000" />
+        <register type="NOA" address="0x00009888" value="0x1D900177" />
+        <register type="NOA" address="0x00009888" value="0x1F900178" />
+        <register type="NOA" address="0x00009888" value="0x35900000" />
+        <register type="NOA" address="0x00009888" value="0x13904000" />
+        <register type="NOA" address="0x00009888" value="0x21904000" />
+        <register type="NOA" address="0x00009888" value="0x23904000" />
+        <register type="NOA" address="0x00009888" value="0x25904000" />
+        <register type="NOA" address="0x00009888" value="0x2F904000" />
+        <register type="NOA" address="0x00009888" value="0x31904000" />
+        <register type="NOA" address="0x00009888" value="0x19904000" />
+        <register type="NOA" address="0x00009888" value="0x1B904000" />
+        <register type="NOA" address="0x00009888" value="0x53901000" />
+        <register type="NOA" address="0x00009888" value="0x43900000" />
+        <register type="NOA" address="0x00009888" value="0x55900111" />
+        <register type="NOA" address="0x00009888" value="0x47900001" />
+        <register type="NOA" address="0x00009888" value="0x57900000" />
+        <register type="NOA" address="0x00009888" value="0x49900000" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+        <register type="NOA" address="0x00009888" value="0x59900000" />
+        <register type="NOA" address="0x00009888" value="0x4B900000" />
+        <register type="NOA" address="0x00009888" value="0x4D900000" />
+        <register type="NOA" address="0x00009888" value="0x45900400" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x30800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x30800000" />
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002770" value="0x0007FFFA" />
+        <register type="OA" address="0x00002774" value="0x0000FEFE" />
+        <register type="OA" address="0x00002778" value="0x0007FFFA" />
+        <register type="OA" address="0x0000277C" value="0x0000FEFD" />
+        <register type="OA" address="0x00002790" value="0x0007FFFA" />
+        <register type="OA" address="0x00002794" value="0x0000FBEF" />
+        <register type="OA" address="0x00002798" value="0x0007FFFA" />
+        <register type="OA" address="0x0000279C" value="0x0000FBDF" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00000003" />
+        <register type="FLEX" address="0x0000E658" value="0x00002001" />
+        <register type="FLEX" address="0x0000E758" value="0x00101100" />
+        <register type="FLEX" address="0x0000E45C" value="0x00201200" />
+        <register type="FLEX" address="0x0000E55C" value="0x00301300" />
+        <register type="FLEX" address="0x0000E65C" value="0x00401400" />
+    </register_config>
+  </set>
+
+  <set name="Metric set HDCAndSF"
+       mdapi_supported_apis="VK OGL OCL IO BB"
+       underscore_name="hdc_and_sf"
+       hw_config_guid="0329ea02-ebb8-43f1-bf89-c5bdcccd3eb4"
+       chipset="GLK"
+       symbol_name="HDCAndSF"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SQ is full"
+             description="The percentage of time when SQ is filled above a threshold (usually 48 entries)"
+             data_type="float"
+             max_equation="100"
+             equation="PERFCNT1 READ_REG 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gt_request_queue_full"
+             units="percent"
+             symbol_name="GTRequestQueueFull"
+             availability="true $QueryMode &&"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL4 OCL"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were actively processed on both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="Polygon Data Ready"
+             description="The percentage of time in which geometry pipeline output is ready"
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="poly_data_ready"
+             units="percent"
+             symbol_name="PolyDataReady"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/3D Pipe/Strip-Fans"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texel lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="HDC stalled by L3 (s0.ss1)"
+             description="Percentage of time when HDC has messages to L3, but it's stalled due to lack of credits (s0.ss1)"
+             data_type="float"
+             max_equation="100"
+             equation="C 5 READ C 4 READ USUB 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="non_sampler_shader01_access_stalled_on_l3"
+             units="percent"
+             symbol_name="NonSamplerShader01AccessStalledOnL3"
+             availability="$SubsliceMask 0x2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="GPU/Data Port"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="HDC stalled by L3 (s0.ss0)"
+             description="Percentage of time when HDC has messages to L3, but it's stalled due to lack of credits (s0.ss0)"
+             data_type="float"
+             max_equation="100"
+             equation="C 7 READ C 6 READ USUB 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="non_sampler_shader00_access_stalled_on_l3"
+             units="percent"
+             symbol_name="NonSamplerShader00AccessStalledOnL3"
+             availability="$SubsliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="GPU/Data Port"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x000091BC" value="0xE0500000" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x104F0232" />
+        <register type="NOA" address="0x00009888" value="0x124F4640" />
+        <register type="NOA" address="0x00009888" value="0x11834400" />
+        <register type="NOA" address="0x00009888" value="0x022D4000" />
+        <register type="NOA" address="0x00009888" value="0x042D5000" />
+        <register type="NOA" address="0x00009888" value="0x062D1000" />
+        <register type="NOA" address="0x00009888" value="0x0E2E0055" />
+        <register type="NOA" address="0x00009888" value="0x064C8000" />
+        <register type="NOA" address="0x00009888" value="0x084CC000" />
+        <register type="NOA" address="0x00009888" value="0x0A4C4000" />
+        <register type="NOA" address="0x00009888" value="0x024E8000" />
+        <register type="NOA" address="0x00009888" value="0x044EA000" />
+        <register type="NOA" address="0x00009888" value="0x064E2000" />
+        <register type="NOA" address="0x00009888" value="0x024F6100" />
+        <register type="NOA" address="0x00009888" value="0x044F416B" />
+        <register type="NOA" address="0x00009888" value="0x064F004B" />
+        <register type="NOA" address="0x00009888" value="0x1A4F0000" />
+        <register type="NOA" address="0x00009888" value="0x1A0F02A8" />
+        <register type="NOA" address="0x00009888" value="0x1A2C5500" />
+        <register type="NOA" address="0x00009888" value="0x0F808000" />
+        <register type="NOA" address="0x00009888" value="0x25810020" />
+        <register type="NOA" address="0x00009888" value="0x0F8305C0" />
+        <register type="NOA" address="0x00009888" value="0x07938000" />
+        <register type="NOA" address="0x00009888" value="0x09938000" />
+        <register type="NOA" address="0x00009888" value="0x0B938000" />
+        <register type="NOA" address="0x00009888" value="0x0D938000" />
+        <register type="NOA" address="0x00009888" value="0x1F951000" />
+        <register type="NOA" address="0x00009888" value="0x13920200" />
+        <register type="NOA" address="0x00009888" value="0x31908000" />
+        <register type="NOA" address="0x00009888" value="0x19904000" />
+        <register type="NOA" address="0x00009888" value="0x1B904000" />
+        <register type="NOA" address="0x00009888" value="0x1D904000" />
+        <register type="NOA" address="0x00009888" value="0x1F904000" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x59900000" />
+        <register type="NOA" address="0x00009888" value="0x4D900003" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+        <register type="NOA" address="0x00009888" value="0x45900000" />
+        <register type="NOA" address="0x00009888" value="0x55900000" />
+        <register type="NOA" address="0x00009888" value="0x47900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002744" value="0x00800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x10800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+        <register type="OA" address="0x00002770" value="0x00000002" />
+        <register type="OA" address="0x00002774" value="0x0000FDFF" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E758" value="0x00015014" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+        <register type="FLEX" address="0x0000E65C" value="0x00055054" />
+    </register_config>
+  </set>
+
+  <set name="Metric set L3_1"
+       mdapi_supported_apis="VK OGL OCL IO BB"
+       underscore_name="l3_1"
+       hw_config_guid="5e57a25a-1d18-4e94-b84b-08ea66751b8c"
+       chipset="GLK"
+       symbol_name="L3_1"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 L3 Bank1 Active"
+             description="The percentage of time in which slice0 L3 bank1 is active"
+             data_type="float"
+             max_equation="100"
+             equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l30_bank1_active"
+             units="percent"
+             symbol_name="L30Bank1Active"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SQ is full"
+             description="The percentage of time when SQ is filled above a threshold (usually 48 entries)"
+             data_type="float"
+             max_equation="100"
+             equation="PERFCNT1 READ_REG 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gt_request_queue_full"
+             units="percent"
+             symbol_name="GTRequestQueueFull"
+             availability="true $QueryMode &&"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL4 OCL"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="Slice0 L3 Bank1 Stalled"
+             description="The percentage of time in which slice0 L3 bank1 is stalled"
+             data_type="float"
+             max_equation="100"
+             equation="B 4 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l30_bank1_stalled"
+             units="percent"
+             symbol_name="L30Bank1Stalled"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 L3 Bank0 Active"
+             description="The percentage of time in which slice0 L3 bank0 is active"
+             data_type="float"
+             max_equation="100"
+             equation="C 6 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l30_bank0_active"
+             units="percent"
+             symbol_name="L30Bank0Active"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 L3 Bank0 Stalled"
+             description="The percentage of time in which slice0 L3 bank0 is stalled"
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l30_bank0_stalled"
+             units="percent"
+             symbol_name="L30Bank0Stalled"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x000091BC" value="0xE0500000" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x12643400" />
+        <register type="NOA" address="0x00009888" value="0x12653400" />
+        <register type="NOA" address="0x00009888" value="0x106C6800" />
+        <register type="NOA" address="0x00009888" value="0x126C001E" />
+        <register type="NOA" address="0x00009888" value="0x166C0010" />
+        <register type="NOA" address="0x00009888" value="0x0C2D5000" />
+        <register type="NOA" address="0x00009888" value="0x0E2D5000" />
+        <register type="NOA" address="0x00009888" value="0x002D4000" />
+        <register type="NOA" address="0x00009888" value="0x022D5000" />
+        <register type="NOA" address="0x00009888" value="0x042D5000" />
+        <register type="NOA" address="0x00009888" value="0x062D1000" />
+        <register type="NOA" address="0x00009888" value="0x102E0154" />
+        <register type="NOA" address="0x00009888" value="0x0C2E5000" />
+        <register type="NOA" address="0x00009888" value="0x0E2E0055" />
+        <register type="NOA" address="0x00009888" value="0x104C8000" />
+        <register type="NOA" address="0x00009888" value="0x124C8000" />
+        <register type="NOA" address="0x00009888" value="0x144C8000" />
+        <register type="NOA" address="0x00009888" value="0x164C2000" />
+        <register type="NOA" address="0x00009888" value="0x044C8000" />
+        <register type="NOA" address="0x00009888" value="0x064CC000" />
+        <register type="NOA" address="0x00009888" value="0x084CC000" />
+        <register type="NOA" address="0x00009888" value="0x0A4C4000" />
+        <register type="NOA" address="0x00009888" value="0x0C4EA000" />
+        <register type="NOA" address="0x00009888" value="0x0E4EA000" />
+        <register type="NOA" address="0x00009888" value="0x004E8000" />
+        <register type="NOA" address="0x00009888" value="0x024EA000" />
+        <register type="NOA" address="0x00009888" value="0x044EA000" />
+        <register type="NOA" address="0x00009888" value="0x064E2000" />
+        <register type="NOA" address="0x00009888" value="0x1C4F5500" />
+        <register type="NOA" address="0x00009888" value="0x1A4F1554" />
+        <register type="NOA" address="0x00009888" value="0x0A640024" />
+        <register type="NOA" address="0x00009888" value="0x10640000" />
+        <register type="NOA" address="0x00009888" value="0x04640000" />
+        <register type="NOA" address="0x00009888" value="0x0C650024" />
+        <register type="NOA" address="0x00009888" value="0x10650000" />
+        <register type="NOA" address="0x00009888" value="0x06650000" />
+        <register type="NOA" address="0x00009888" value="0x0C6C5327" />
+        <register type="NOA" address="0x00009888" value="0x0E6C5425" />
+        <register type="NOA" address="0x00009888" value="0x006C2A00" />
+        <register type="NOA" address="0x00009888" value="0x026C285B" />
+        <register type="NOA" address="0x00009888" value="0x046C005C" />
+        <register type="NOA" address="0x00009888" value="0x1C6C0000" />
+        <register type="NOA" address="0x00009888" value="0x1A6C0900" />
+        <register type="NOA" address="0x00009888" value="0x1C0F0AA0" />
+        <register type="NOA" address="0x00009888" value="0x180F4000" />
+        <register type="NOA" address="0x00009888" value="0x1A0F02AA" />
+        <register type="NOA" address="0x00009888" value="0x1C2C5400" />
+        <register type="NOA" address="0x00009888" value="0x1E2C0001" />
+        <register type="NOA" address="0x00009888" value="0x1A2C5550" />
+        <register type="NOA" address="0x00009888" value="0x1993AA00" />
+        <register type="NOA" address="0x00009888" value="0x03938000" />
+        <register type="NOA" address="0x00009888" value="0x05938000" />
+        <register type="NOA" address="0x00009888" value="0x07938000" />
+        <register type="NOA" address="0x00009888" value="0x09938000" />
+        <register type="NOA" address="0x00009888" value="0x0B938000" />
+        <register type="NOA" address="0x00009888" value="0x0D938000" />
+        <register type="NOA" address="0x00009888" value="0x2B904000" />
+        <register type="NOA" address="0x00009888" value="0x2D904000" />
+        <register type="NOA" address="0x00009888" value="0x2F904000" />
+        <register type="NOA" address="0x00009888" value="0x31904000" />
+        <register type="NOA" address="0x00009888" value="0x15904000" />
+        <register type="NOA" address="0x00009888" value="0x17904000" />
+        <register type="NOA" address="0x00009888" value="0x19904000" />
+        <register type="NOA" address="0x00009888" value="0x1B904000" />
+        <register type="NOA" address="0x00009888" value="0x1D904000" />
+        <register type="NOA" address="0x00009888" value="0x1F904000" />
+        <register type="NOA" address="0x00009888" value="0x59900000" />
+        <register type="NOA" address="0x00009888" value="0x4B900421" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+        <register type="NOA" address="0x00009888" value="0x4D900001" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+        <register type="NOA" address="0x00009888" value="0x43900420" />
+        <register type="NOA" address="0x00009888" value="0x45900021" />
+        <register type="NOA" address="0x00009888" value="0x55900000" />
+        <register type="NOA" address="0x00009888" value="0x47900000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002744" value="0x00800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0xF0800000" />
+        <register type="OA" address="0x00002770" value="0x00100070" />
+        <register type="OA" address="0x00002774" value="0x0000FFF1" />
+        <register type="OA" address="0x00002778" value="0x00014002" />
+        <register type="OA" address="0x0000277C" value="0x0000C3FF" />
+        <register type="OA" address="0x00002780" value="0x00010002" />
+        <register type="OA" address="0x00002784" value="0x0000C7FF" />
+        <register type="OA" address="0x00002788" value="0x00004002" />
+        <register type="OA" address="0x0000278C" value="0x0000D3FF" />
+        <register type="OA" address="0x00002790" value="0x00100700" />
+        <register type="OA" address="0x00002794" value="0x0000FF1F" />
+        <register type="OA" address="0x00002798" value="0x00001402" />
+        <register type="OA" address="0x0000279C" value="0x0000FC3F" />
+        <register type="OA" address="0x000027A0" value="0x00001002" />
+        <register type="OA" address="0x000027A4" value="0x0000FC7F" />
+        <register type="OA" address="0x000027A8" value="0x00000402" />
+        <register type="OA" address="0x000027AC" value="0x0000FD3F" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E758" value="0x00015014" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+        <register type="FLEX" address="0x0000E65C" value="0x00055054" />
+    </register_config>
+  </set>
+
+  <set name="Metric set RasterizerAndPixelBackend"
+       mdapi_supported_apis="VK OGL OCL IO BB"
+       underscore_name="rasterizer_and_pixel_backend"
+       hw_config_guid="f0652373-d361-426f-b36d-9ffec288bdc6"
+       chipset="GLK"
+       symbol_name="RasterizerAndPixelBackend"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SQ is full"
+             description="The percentage of time when SQ is filled above a threshold (usually 48 entries)"
+             data_type="float"
+             max_equation="100"
+             equation="PERFCNT1 READ_REG 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gt_request_queue_full"
+             units="percent"
+             symbol_name="GTRequestQueueFull"
+             availability="true $QueryMode &&"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL4 OCL"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on the both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Slice0 Pixel Values Ready"
+             description="The percentage of time in which slice0 pixel values are ready"
+             data_type="float"
+             max_equation="100"
+             equation="C 6 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="pixel_values0_ready"
+             units="percent"
+             symbol_name="PixelValues0Ready"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/3D Pipe"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="Slice0 Rasterizer Input Available"
+             description="The percentage of time in which slice0 rasterizer input is available"
+             data_type="float"
+             max_equation="100"
+             equation="B 1 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="rasterizer0_input_available"
+             units="percent"
+             symbol_name="Rasterizer0InputAvailable"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Rasterizer"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Slice0 Post-EarlyZ Pixel Data Ready"
+             description="The percentage of time in which slice0 post-EarlyZ pixel data is ready (after early Z tests have been applied)"
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="pixel_data0_ready"
+             units="percent"
+             symbol_name="PixelData0Ready"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Rasterizer/Early Depth Test"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 Rasterizer Output Ready"
+             description="The percentage of time in which slice0 rasterizer output is ready"
+             data_type="float"
+             max_equation="100"
+             equation="C 5 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="rasterizer0_output_ready"
+             units="percent"
+             symbol_name="Rasterizer0OutputReady"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Rasterizer"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="Slice0 PS Output Available"
+             description="The percentage of time in which slice0 PS output is available"
+             data_type="float"
+             max_equation="100"
+             equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_output0_available"
+             units="percent"
+             symbol_name="PSOutput0Available"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/3D Pipe"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x000091BC" value="0xE0500000" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x102D7800" />
+        <register type="NOA" address="0x00009888" value="0x122D79E0" />
+        <register type="NOA" address="0x00009888" value="0x0C2F0004" />
+        <register type="NOA" address="0x00009888" value="0x100E3800" />
+        <register type="NOA" address="0x00009888" value="0x180F0005" />
+        <register type="NOA" address="0x00009888" value="0x002D0940" />
+        <register type="NOA" address="0x00009888" value="0x022D802F" />
+        <register type="NOA" address="0x00009888" value="0x042D4013" />
+        <register type="NOA" address="0x00009888" value="0x062D1000" />
+        <register type="NOA" address="0x00009888" value="0x0E2E0050" />
+        <register type="NOA" address="0x00009888" value="0x022F0010" />
+        <register type="NOA" address="0x00009888" value="0x002F0000" />
+        <register type="NOA" address="0x00009888" value="0x084C8000" />
+        <register type="NOA" address="0x00009888" value="0x0A4C4000" />
+        <register type="NOA" address="0x00009888" value="0x044E8000" />
+        <register type="NOA" address="0x00009888" value="0x064E2000" />
+        <register type="NOA" address="0x00009888" value="0x040E0480" />
+        <register type="NOA" address="0x00009888" value="0x000E0000" />
+        <register type="NOA" address="0x00009888" value="0x060F0027" />
+        <register type="NOA" address="0x00009888" value="0x100F0000" />
+        <register type="NOA" address="0x00009888" value="0x1A0F0040" />
+        <register type="NOA" address="0x00009888" value="0x03938000" />
+        <register type="NOA" address="0x00009888" value="0x05938000" />
+        <register type="NOA" address="0x00009888" value="0x07938000" />
+        <register type="NOA" address="0x00009888" value="0x09938000" />
+        <register type="NOA" address="0x00009888" value="0x0B938000" />
+        <register type="NOA" address="0x00009888" value="0x0D938000" />
+        <register type="NOA" address="0x00009888" value="0x15904000" />
+        <register type="NOA" address="0x00009888" value="0x17904000" />
+        <register type="NOA" address="0x00009888" value="0x19904000" />
+        <register type="NOA" address="0x00009888" value="0x1B904000" />
+        <register type="NOA" address="0x00009888" value="0x1D904000" />
+        <register type="NOA" address="0x00009888" value="0x1F904000" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+        <register type="NOA" address="0x00009888" value="0x439014A0" />
+        <register type="NOA" address="0x00009888" value="0x459000A4" />
+        <register type="NOA" address="0x00009888" value="0x55900000" />
+        <register type="NOA" address="0x00009888" value="0x47900001" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002744" value="0x00800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x30800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+        <register type="OA" address="0x00002770" value="0x00000002" />
+        <register type="OA" address="0x00002774" value="0x0000EFFF" />
+        <register type="OA" address="0x00002778" value="0x00006000" />
+        <register type="OA" address="0x0000277C" value="0x0000F3FF" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E758" value="0x00015014" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+        <register type="FLEX" address="0x0000E65C" value="0x00055054" />
+    </register_config>
+  </set>
+
+  <set name="Metric set Sampler"
+       mdapi_supported_apis="VK OGL OCL IO BB"
+       underscore_name="sampler"
+       hw_config_guid="6ac97d12-ce13-428a-b20c-6902bde2608b"
+       chipset="GLK"
+       symbol_name="Sampler"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 Subslice2 Input Available"
+             description="The percentage of time in which slice0 subslice2 sampler input is available"
+             data_type="float"
+             max_equation="100"
+             equation="B 1 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler02_input_available"
+             units="percent"
+             symbol_name="Sampler02InputAvailable"
+             availability="$SubsliceMask 0x4 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SQ is full"
+             description="The percentage of time when SQ is filled above a threshold (usually 48 entries)"
+             data_type="float"
+             max_equation="100"
+             equation="PERFCNT1 READ_REG 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gt_request_queue_full"
+             units="percent"
+             symbol_name="GTRequestQueueFull"
+             availability="true $QueryMode &&"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL4 OCL"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 Subslice0 Input Available"
+             description="The percentage of time in which slice0 subslice0 sampler input is available"
+             data_type="float"
+             max_equation="100"
+             equation="B 2 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler00_input_available"
+             units="percent"
+             symbol_name="Sampler00InputAvailable"
+             availability="$SubsliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on the both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="Slice0 Subslice2 Sampler Output Ready"
+             description="The percentage of time in which slice0 subslice2 sampler output is ready"
+             data_type="float"
+             max_equation="100"
+             equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler02_output_ready"
+             units="percent"
+             symbol_name="Sampler02OutputReady"
+             availability="$SubsliceMask 0x4 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Slice0 Subslice1 Input Available"
+             description="The percentage of time in which slice0 subslice1 sampler input is available"
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler01_input_available"
+             units="percent"
+             symbol_name="Sampler01InputAvailable"
+             availability="$SubsliceMask 0x2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texel lookups (with 2x2 accuracy) that missed the L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Slice0 Subslice0 Sampler Output Ready"
+             description="The percentage of time in which slice0 subslice0 sampler output is ready"
+             data_type="float"
+             max_equation="100"
+             equation="C 6 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler00_output_ready"
+             units="percent"
+             symbol_name="Sampler00OutputReady"
+             availability="$SubsliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Slice0 Subslice1 Sampler Output Ready"
+             description="The percentage of time in which slice0 subslice1 sampler output is ready"
+             data_type="float"
+             max_equation="100"
+             equation="C 5 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler01_output_ready"
+             units="percent"
+             symbol_name="Sampler01OutputReady"
+             availability="$SubsliceMask 0x2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x000091BC" value="0xE0500000" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x121300A0" />
+        <register type="NOA" address="0x00009888" value="0x141600AB" />
+        <register type="NOA" address="0x00009888" value="0x123300A0" />
+        <register type="NOA" address="0x00009888" value="0x143600AB" />
+        <register type="NOA" address="0x00009888" value="0x125300A0" />
+        <register type="NOA" address="0x00009888" value="0x145600AB" />
+        <register type="NOA" address="0x00009888" value="0x0C2D4000" />
+        <register type="NOA" address="0x00009888" value="0x0E2D5000" />
+        <register type="NOA" address="0x00009888" value="0x002D4000" />
+        <register type="NOA" address="0x00009888" value="0x022D5000" />
+        <register type="NOA" address="0x00009888" value="0x042D5000" />
+        <register type="NOA" address="0x00009888" value="0x062D1000" />
+        <register type="NOA" address="0x00009888" value="0x102E01A0" />
+        <register type="NOA" address="0x00009888" value="0x0C2E5000" />
+        <register type="NOA" address="0x00009888" value="0x0E2E0065" />
+        <register type="NOA" address="0x00009888" value="0x164C2000" />
+        <register type="NOA" address="0x00009888" value="0x044C8000" />
+        <register type="NOA" address="0x00009888" value="0x064CC000" />
+        <register type="NOA" address="0x00009888" value="0x084C4000" />
+        <register type="NOA" address="0x00009888" value="0x0A4C4000" />
+        <register type="NOA" address="0x00009888" value="0x0E4E8000" />
+        <register type="NOA" address="0x00009888" value="0x004E8000" />
+        <register type="NOA" address="0x00009888" value="0x024EA000" />
+        <register type="NOA" address="0x00009888" value="0x044E2000" />
+        <register type="NOA" address="0x00009888" value="0x064E2000" />
+        <register type="NOA" address="0x00009888" value="0x1C0F0800" />
+        <register type="NOA" address="0x00009888" value="0x180F4000" />
+        <register type="NOA" address="0x00009888" value="0x1A0F023F" />
+        <register type="NOA" address="0x00009888" value="0x1E2C0003" />
+        <register type="NOA" address="0x00009888" value="0x1A2CC030" />
+        <register type="NOA" address="0x00009888" value="0x04132180" />
+        <register type="NOA" address="0x00009888" value="0x02130000" />
+        <register type="NOA" address="0x00009888" value="0x0C148000" />
+        <register type="NOA" address="0x00009888" value="0x0E142000" />
+        <register type="NOA" address="0x00009888" value="0x04148000" />
+        <register type="NOA" address="0x00009888" value="0x1E150140" />
+        <register type="NOA" address="0x00009888" value="0x1C150040" />
+        <register type="NOA" address="0x00009888" value="0x0C163000" />
+        <register type="NOA" address="0x00009888" value="0x0E160068" />
+        <register type="NOA" address="0x00009888" value="0x10160000" />
+        <register type="NOA" address="0x00009888" value="0x18160000" />
+        <register type="NOA" address="0x00009888" value="0x0A164000" />
+        <register type="NOA" address="0x00009888" value="0x04330043" />
+        <register type="NOA" address="0x00009888" value="0x02330000" />
+        <register type="NOA" address="0x00009888" value="0x0234A000" />
+        <register type="NOA" address="0x00009888" value="0x04342000" />
+        <register type="NOA" address="0x00009888" value="0x1C350015" />
+        <register type="NOA" address="0x00009888" value="0x02363460" />
+        <register type="NOA" address="0x00009888" value="0x10360000" />
+        <register type="NOA" address="0x00009888" value="0x04360000" />
+        <register type="NOA" address="0x00009888" value="0x06360000" />
+        <register type="NOA" address="0x00009888" value="0x08364000" />
+        <register type="NOA" address="0x00009888" value="0x06530043" />
+        <register type="NOA" address="0x00009888" value="0x02530000" />
+        <register type="NOA" address="0x00009888" value="0x0E548000" />
+        <register type="NOA" address="0x00009888" value="0x00548000" />
+        <register type="NOA" address="0x00009888" value="0x06542000" />
+        <register type="NOA" address="0x00009888" value="0x1E550400" />
+        <register type="NOA" address="0x00009888" value="0x1A552000" />
+        <register type="NOA" address="0x00009888" value="0x1C550100" />
+        <register type="NOA" address="0x00009888" value="0x0E563000" />
+        <register type="NOA" address="0x00009888" value="0x00563400" />
+        <register type="NOA" address="0x00009888" value="0x10560000" />
+        <register type="NOA" address="0x00009888" value="0x18560000" />
+        <register type="NOA" address="0x00009888" value="0x02560000" />
+        <register type="NOA" address="0x00009888" value="0x0C564000" />
+        <register type="NOA" address="0x00009888" value="0x1993A800" />
+        <register type="NOA" address="0x00009888" value="0x03938000" />
+        <register type="NOA" address="0x00009888" value="0x05938000" />
+        <register type="NOA" address="0x00009888" value="0x07938000" />
+        <register type="NOA" address="0x00009888" value="0x09938000" />
+        <register type="NOA" address="0x00009888" value="0x0B938000" />
+        <register type="NOA" address="0x00009888" value="0x0D938000" />
+        <register type="NOA" address="0x00009888" value="0x2D904000" />
+        <register type="NOA" address="0x00009888" value="0x2F904000" />
+        <register type="NOA" address="0x00009888" value="0x31904000" />
+        <register type="NOA" address="0x00009888" value="0x15904000" />
+        <register type="NOA" address="0x00009888" value="0x17904000" />
+        <register type="NOA" address="0x00009888" value="0x19904000" />
+        <register type="NOA" address="0x00009888" value="0x1B904000" />
+        <register type="NOA" address="0x00009888" value="0x1D904000" />
+        <register type="NOA" address="0x00009888" value="0x1F904000" />
+        <register type="NOA" address="0x00009888" value="0x59900000" />
+        <register type="NOA" address="0x00009888" value="0x4B9014A0" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+        <register type="NOA" address="0x00009888" value="0x4D900001" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+        <register type="NOA" address="0x00009888" value="0x43900820" />
+        <register type="NOA" address="0x00009888" value="0x45901022" />
+        <register type="NOA" address="0x00009888" value="0x55900000" />
+        <register type="NOA" address="0x00009888" value="0x47900000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002744" value="0x00800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x70800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+        <register type="OA" address="0x00002770" value="0x0000C000" />
+        <register type="OA" address="0x00002774" value="0x0000E7FF" />
+        <register type="OA" address="0x00002778" value="0x00003000" />
+        <register type="OA" address="0x0000277C" value="0x0000F9FF" />
+        <register type="OA" address="0x00002780" value="0x00000C00" />
+        <register type="OA" address="0x00002784" value="0x0000FE7F" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E758" value="0x00015014" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+        <register type="FLEX" address="0x0000E65C" value="0x00055054" />
+    </register_config>
+  </set>
+
+  <set name="Metric set TDL_1"
+       mdapi_supported_apis="VK OGL OCL IO BB"
+       underscore_name="tdl_1"
+       hw_config_guid="59ea703a-9a35-4aed-a985-0d9ab7aceaba"
+       chipset="GLK"
+       symbol_name="TDL_1"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SQ is full"
+             description="The percentage of time when SQ is filled above a threshold (usually 48 entries)"
+             data_type="float"
+             max_equation="100"
+             equation="PERFCNT1 READ_REG 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gt_request_queue_full"
+             units="percent"
+             symbol_name="GTRequestQueueFull"
+             availability="true $QueryMode &&"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL4 OCL"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="NonPS Thread Ready For Dispatch on Slice0 Subslice2"
+             description="The percentage of time in which non-PS thread is ready for dispatch on slice0 subslice2 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="B 4 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="non_ps_thread02_ready_for_dispatch"
+             units="percent"
+             symbol_name="NonPSThread02ReadyForDispatch"
+             availability="$SubsliceMask 0x4 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="NonPS Thread Ready For Dispatch on Slice0 Subslice0"
+             description="The percentage of time in which non-PS thread is ready for dispatch on slice0 subslice0 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="B 2 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="non_ps_thread00_ready_for_dispatch"
+             units="percent"
+             symbol_name="NonPSThread00ReadyForDispatch"
+             availability="$SubsliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Thread Ready For Dispatch on Slice0 Subslice0"
+             description="The percentage of time in which PS thread is ready for dispatch on slice0 subslice0 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="B 1 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_thread00_ready_for_dispatch"
+             units="percent"
+             symbol_name="PSThread00ReadyForDispatch"
+             availability="$SubsliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="PS Thread Ready For Dispatch on Slice0 Subslice1"
+             description="The percentage of time in which PS thread is ready for dispatch on slice0 subslice1 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="B 5 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_thread01_ready_for_dispatch"
+             units="percent"
+             symbol_name="PSThread01ReadyForDispatch"
+             availability="$SubsliceMask 0x2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="PS Thread Ready For Dispatch on Slice0 Subslice2"
+             description="The percentage of time in which PS thread is ready for dispatch on slice0 subslice2 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="B 3 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_thread02_ready_for_dispatch"
+             units="percent"
+             symbol_name="PSThread02ReadyForDispatch"
+             availability="$SubsliceMask 0x4 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <counter name="NonPS Thread Ready For Dispatch on Slice0 Subslice1"
+             description="The percentage of time in which non-PS thread is ready for dispatch on slice0 subslice1 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="non_ps_thread01_ready_for_dispatch"
+             units="percent"
+             symbol_name="NonPSThread01ReadyForDispatch"
+             availability="$SubsliceMask 0x2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x000091BC" value="0xE0500000" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x141A0000" />
+        <register type="NOA" address="0x00009888" value="0x143A0000" />
+        <register type="NOA" address="0x00009888" value="0x145A0000" />
+        <register type="NOA" address="0x00009888" value="0x0C2D4000" />
+        <register type="NOA" address="0x00009888" value="0x0E2D5000" />
+        <register type="NOA" address="0x00009888" value="0x002D4000" />
+        <register type="NOA" address="0x00009888" value="0x022D5000" />
+        <register type="NOA" address="0x00009888" value="0x042D5000" />
+        <register type="NOA" address="0x00009888" value="0x062D1000" />
+        <register type="NOA" address="0x00009888" value="0x102E0150" />
+        <register type="NOA" address="0x00009888" value="0x0C2E5000" />
+        <register type="NOA" address="0x00009888" value="0x0E2E006A" />
+        <register type="NOA" address="0x00009888" value="0x124C8000" />
+        <register type="NOA" address="0x00009888" value="0x144C8000" />
+        <register type="NOA" address="0x00009888" value="0x164C2000" />
+        <register type="NOA" address="0x00009888" value="0x044C8000" />
+        <register type="NOA" address="0x00009888" value="0x064C4000" />
+        <register type="NOA" address="0x00009888" value="0x0A4C4000" />
+        <register type="NOA" address="0x00009888" value="0x0C4E8000" />
+        <register type="NOA" address="0x00009888" value="0x0E4EA000" />
+        <register type="NOA" address="0x00009888" value="0x004E8000" />
+        <register type="NOA" address="0x00009888" value="0x024E2000" />
+        <register type="NOA" address="0x00009888" value="0x064E2000" />
+        <register type="NOA" address="0x00009888" value="0x1C0F0BC0" />
+        <register type="NOA" address="0x00009888" value="0x180F4000" />
+        <register type="NOA" address="0x00009888" value="0x1A0F0302" />
+        <register type="NOA" address="0x00009888" value="0x1E2C0003" />
+        <register type="NOA" address="0x00009888" value="0x1A2C00F0" />
+        <register type="NOA" address="0x00009888" value="0x021A3080" />
+        <register type="NOA" address="0x00009888" value="0x041A31E5" />
+        <register type="NOA" address="0x00009888" value="0x02148000" />
+        <register type="NOA" address="0x00009888" value="0x0414A000" />
+        <register type="NOA" address="0x00009888" value="0x1C150054" />
+        <register type="NOA" address="0x00009888" value="0x06168000" />
+        <register type="NOA" address="0x00009888" value="0x08168000" />
+        <register type="NOA" address="0x00009888" value="0x0A168000" />
+        <register type="NOA" address="0x00009888" value="0x0C3A3280" />
+        <register type="NOA" address="0x00009888" value="0x0E3A0063" />
+        <register type="NOA" address="0x00009888" value="0x063A0061" />
+        <register type="NOA" address="0x00009888" value="0x023A0000" />
+        <register type="NOA" address="0x00009888" value="0x0C348000" />
+        <register type="NOA" address="0x00009888" value="0x0E342000" />
+        <register type="NOA" address="0x00009888" value="0x06342000" />
+        <register type="NOA" address="0x00009888" value="0x1E350140" />
+        <register type="NOA" address="0x00009888" value="0x1C350100" />
+        <register type="NOA" address="0x00009888" value="0x18360028" />
+        <register type="NOA" address="0x00009888" value="0x0C368000" />
+        <register type="NOA" address="0x00009888" value="0x0E5A3080" />
+        <register type="NOA" address="0x00009888" value="0x005A3280" />
+        <register type="NOA" address="0x00009888" value="0x025A0063" />
+        <register type="NOA" address="0x00009888" value="0x0E548000" />
+        <register type="NOA" address="0x00009888" value="0x00548000" />
+        <register type="NOA" address="0x00009888" value="0x02542000" />
+        <register type="NOA" address="0x00009888" value="0x1E550400" />
+        <register type="NOA" address="0x00009888" value="0x1A552000" />
+        <register type="NOA" address="0x00009888" value="0x1C550001" />
+        <register type="NOA" address="0x00009888" value="0x18560080" />
+        <register type="NOA" address="0x00009888" value="0x02568000" />
+        <register type="NOA" address="0x00009888" value="0x04568000" />
+        <register type="NOA" address="0x00009888" value="0x1993A800" />
+        <register type="NOA" address="0x00009888" value="0x03938000" />
+        <register type="NOA" address="0x00009888" value="0x05938000" />
+        <register type="NOA" address="0x00009888" value="0x07938000" />
+        <register type="NOA" address="0x00009888" value="0x09938000" />
+        <register type="NOA" address="0x00009888" value="0x0B938000" />
+        <register type="NOA" address="0x00009888" value="0x0D938000" />
+        <register type="NOA" address="0x00009888" value="0x2D904000" />
+        <register type="NOA" address="0x00009888" value="0x2F904000" />
+        <register type="NOA" address="0x00009888" value="0x31904000" />
+        <register type="NOA" address="0x00009888" value="0x15904000" />
+        <register type="NOA" address="0x00009888" value="0x17904000" />
+        <register type="NOA" address="0x00009888" value="0x19904000" />
+        <register type="NOA" address="0x00009888" value="0x1B904000" />
+        <register type="NOA" address="0x00009888" value="0x1D904000" />
+        <register type="NOA" address="0x00009888" value="0x1F904000" />
+        <register type="NOA" address="0x00009888" value="0x59900000" />
+        <register type="NOA" address="0x00009888" value="0x4B900420" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+        <register type="NOA" address="0x00009888" value="0x4D900000" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+        <register type="NOA" address="0x00009888" value="0x43900000" />
+        <register type="NOA" address="0x00009888" value="0x45901084" />
+        <register type="NOA" address="0x00009888" value="0x55900000" />
+        <register type="NOA" address="0x00009888" value="0x47900001" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002744" value="0x00800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x30800000" />
+        <register type="OA" address="0x00002770" value="0x00000002" />
+        <register type="OA" address="0x00002774" value="0x00007FFF" />
+        <register type="OA" address="0x00002778" value="0x00000000" />
+        <register type="OA" address="0x0000277C" value="0x00009FFF" />
+        <register type="OA" address="0x00002780" value="0x00000002" />
+        <register type="OA" address="0x00002784" value="0x0000EFFF" />
+        <register type="OA" address="0x00002788" value="0x00000000" />
+        <register type="OA" address="0x0000278C" value="0x0000F3FF" />
+        <register type="OA" address="0x00002790" value="0x00000002" />
+        <register type="OA" address="0x00002794" value="0x0000FDFF" />
+        <register type="OA" address="0x00002798" value="0x00000000" />
+        <register type="OA" address="0x0000279C" value="0x0000FE7F" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E758" value="0x00015014" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+        <register type="FLEX" address="0x0000E65C" value="0x00055054" />
+    </register_config>
+  </set>
+
+  <set name="Metric set TDL_2"
+       mdapi_supported_apis="VK OGL OCL IO BB"
+       underscore_name="tdl_2"
+       hw_config_guid="f2d6d718-e7b1-48f4-9624-45230d2fe2a0"
+       chipset="GLK"
+       symbol_name="TDL_2"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SQ is full"
+             description="The percentage of time when SQ is filled above a threshold (usually 48 entries)"
+             data_type="float"
+             max_equation="100"
+             equation="PERFCNT1 READ_REG 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gt_request_queue_full"
+             units="percent"
+             symbol_name="GTRequestQueueFull"
+             availability="true $QueryMode &&"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL4 OCL"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on the both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Thread Header Ready on Slice0 Subslice1 Port 0"
+             description="The percentage of time in which thread header is ready on slice0 subslice1 thread dispatcher port 0"
+             data_type="float"
+             max_equation="100"
+             equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header01_ready_port0"
+             units="percent"
+             symbol_name="ThreadHeader01ReadyPort0"
+             availability="$SubsliceMask 0x2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Thread Header Ready on Slice0 Subslice1 Port 1"
+             description="The percentage of time in which thread header is ready on slice0 subslice1 thread dispatcher port 1"
+             data_type="float"
+             max_equation="100"
+             equation="C 2 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header01_ready_port1"
+             units="percent"
+             symbol_name="ThreadHeader01ReadyPort1"
+             availability="$SubsliceMask 0x2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Thread Header Ready on Slice0 Subslice2 Port 1"
+             description="The percentage of time in which thread header is ready on slice0 subslice2 thread dispatcher port 1"
+             data_type="float"
+             max_equation="100"
+             equation="C 4 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header02_ready_port1"
+             units="percent"
+             symbol_name="ThreadHeader02ReadyPort1"
+             availability="$SubsliceMask 0x4 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Thread Header Ready on Slice0 Subslice2 Port 0"
+             description="The percentage of time in which thread header is ready on slice0 subslice2 thread dispatcher port 0"
+             data_type="float"
+             max_equation="100"
+             equation="C 3 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header02_ready_port0"
+             units="percent"
+             symbol_name="ThreadHeader02ReadyPort0"
+             availability="$SubsliceMask 0x4 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="Thread Header Ready on Slice0 Subslice0 Port 0"
+             description="The percentage of time in which thread header is ready on slice0 subslice0 thread dispatcher port 0"
+             data_type="float"
+             max_equation="100"
+             equation="C 5 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header00_ready_port0"
+             units="percent"
+             symbol_name="ThreadHeader00ReadyPort0"
+             availability="$SubsliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <counter name="Thread Header Ready on Slice0 Subslice0 Port 1"
+             description="The percentage of time in which thread header is ready on slice0 subslice0 thread dispatcher port 1"
+             data_type="float"
+             max_equation="100"
+             equation="C 6 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header00_ready_port1"
+             units="percent"
+             symbol_name="ThreadHeader00ReadyPort1"
+             availability="$SubsliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x000091BC" value="0xE0500000" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x141A026B" />
+        <register type="NOA" address="0x00009888" value="0x143A0173" />
+        <register type="NOA" address="0x00009888" value="0x145A026B" />
+        <register type="NOA" address="0x00009888" value="0x002D4000" />
+        <register type="NOA" address="0x00009888" value="0x022D5000" />
+        <register type="NOA" address="0x00009888" value="0x042D5000" />
+        <register type="NOA" address="0x00009888" value="0x062D1000" />
+        <register type="NOA" address="0x00009888" value="0x0C2E5000" />
+        <register type="NOA" address="0x00009888" value="0x0E2E0069" />
+        <register type="NOA" address="0x00009888" value="0x044C8000" />
+        <register type="NOA" address="0x00009888" value="0x064CC000" />
+        <register type="NOA" address="0x00009888" value="0x0A4C4000" />
+        <register type="NOA" address="0x00009888" value="0x004E8000" />
+        <register type="NOA" address="0x00009888" value="0x024EA000" />
+        <register type="NOA" address="0x00009888" value="0x064E2000" />
+        <register type="NOA" address="0x00009888" value="0x180F6000" />
+        <register type="NOA" address="0x00009888" value="0x1A0F030A" />
+        <register type="NOA" address="0x00009888" value="0x1A2C03C0" />
+        <register type="NOA" address="0x00009888" value="0x041A37E7" />
+        <register type="NOA" address="0x00009888" value="0x021A0000" />
+        <register type="NOA" address="0x00009888" value="0x0414A000" />
+        <register type="NOA" address="0x00009888" value="0x1C150050" />
+        <register type="NOA" address="0x00009888" value="0x08168000" />
+        <register type="NOA" address="0x00009888" value="0x0A168000" />
+        <register type="NOA" address="0x00009888" value="0x003A3380" />
+        <register type="NOA" address="0x00009888" value="0x063A006F" />
+        <register type="NOA" address="0x00009888" value="0x023A0000" />
+        <register type="NOA" address="0x00009888" value="0x00348000" />
+        <register type="NOA" address="0x00009888" value="0x06342000" />
+        <register type="NOA" address="0x00009888" value="0x1A352000" />
+        <register type="NOA" address="0x00009888" value="0x1C350100" />
+        <register type="NOA" address="0x00009888" value="0x02368000" />
+        <register type="NOA" address="0x00009888" value="0x0C368000" />
+        <register type="NOA" address="0x00009888" value="0x025A37E7" />
+        <register type="NOA" address="0x00009888" value="0x0254A000" />
+        <register type="NOA" address="0x00009888" value="0x1C550005" />
+        <register type="NOA" address="0x00009888" value="0x04568000" />
+        <register type="NOA" address="0x00009888" value="0x06568000" />
+        <register type="NOA" address="0x00009888" value="0x03938000" />
+        <register type="NOA" address="0x00009888" value="0x05938000" />
+        <register type="NOA" address="0x00009888" value="0x07938000" />
+        <register type="NOA" address="0x00009888" value="0x09938000" />
+        <register type="NOA" address="0x00009888" value="0x0B938000" />
+        <register type="NOA" address="0x00009888" value="0x0D938000" />
+        <register type="NOA" address="0x00009888" value="0x15904000" />
+        <register type="NOA" address="0x00009888" value="0x17904000" />
+        <register type="NOA" address="0x00009888" value="0x19904000" />
+        <register type="NOA" address="0x00009888" value="0x1B904000" />
+        <register type="NOA" address="0x00009888" value="0x1D904000" />
+        <register type="NOA" address="0x00009888" value="0x1F904000" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+        <register type="NOA" address="0x00009888" value="0x43900020" />
+        <register type="NOA" address="0x00009888" value="0x45901080" />
+        <register type="NOA" address="0x00009888" value="0x55900000" />
+        <register type="NOA" address="0x00009888" value="0x47900001" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002744" value="0x00800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x00800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E758" value="0x00015014" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+        <register type="FLEX" address="0x0000E65C" value="0x00055054" />
+    </register_config>
+  </set>
+
+  <set name="Compute Metrics Extra Gen9"
+       mdapi_supported_apis="VK OGL4 OCL IO BB"
+       underscore_name="compute_extra"
+       hw_config_guid="15274c82-27d2-4819-876a-7cb1a2c59ba4"
+       chipset="GLK"
+       symbol_name="ComputeExtra"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="fpu1_active"
+             units="percent"
+             symbol_name="Fpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU1 Pipe Active including Ext Math"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing including Extended Math processing"
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ  C 7 READ C 6 READ FADD C 5 READ FADD 8 FMUL FADD 100 FMUL $EuCoresTotalCount FDIV $GpuCoreClocks FDIV"
+             underscore_name="fpu1_active_adjusted"
+             units="percent"
+             symbol_name="Fpu1ActiveAdjusted"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x141A001F" />
+        <register type="NOA" address="0x00009888" value="0x143A001F" />
+        <register type="NOA" address="0x00009888" value="0x145A001F" />
+        <register type="NOA" address="0x00009888" value="0x042D5000" />
+        <register type="NOA" address="0x00009888" value="0x062D1000" />
+        <register type="NOA" address="0x00009888" value="0x0E2E0094" />
+        <register type="NOA" address="0x00009888" value="0x084CC000" />
+        <register type="NOA" address="0x00009888" value="0x044EA000" />
+        <register type="NOA" address="0x00009888" value="0x1A0F00E0" />
+        <register type="NOA" address="0x00009888" value="0x1A2C0C00" />
+        <register type="NOA" address="0x00009888" value="0x061A0063" />
+        <register type="NOA" address="0x00009888" value="0x021A0000" />
+        <register type="NOA" address="0x00009888" value="0x06142000" />
+        <register type="NOA" address="0x00009888" value="0x1C150100" />
+        <register type="NOA" address="0x00009888" value="0x0C168000" />
+        <register type="NOA" address="0x00009888" value="0x043A3180" />
+        <register type="NOA" address="0x00009888" value="0x023A0000" />
+        <register type="NOA" address="0x00009888" value="0x04348000" />
+        <register type="NOA" address="0x00009888" value="0x1C350040" />
+        <register type="NOA" address="0x00009888" value="0x0A368000" />
+        <register type="NOA" address="0x00009888" value="0x045A0063" />
+        <register type="NOA" address="0x00009888" value="0x025A0000" />
+        <register type="NOA" address="0x00009888" value="0x04542000" />
+        <register type="NOA" address="0x00009888" value="0x1C550010" />
+        <register type="NOA" address="0x00009888" value="0x08568000" />
+        <register type="NOA" address="0x00009888" value="0x09938000" />
+        <register type="NOA" address="0x00009888" value="0x0B938000" />
+        <register type="NOA" address="0x00009888" value="0x0D938000" />
+        <register type="NOA" address="0x00009888" value="0x1B904000" />
+        <register type="NOA" address="0x00009888" value="0x1D904000" />
+        <register type="NOA" address="0x00009888" value="0x1F904000" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x55900000" />
+        <register type="NOA" address="0x00009888" value="0x45900400" />
+        <register type="NOA" address="0x00009888" value="0x47900004" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002744" value="0x00800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x00800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00001000" />
+        <register type="FLEX" address="0x0000E558" value="0x00003002" />
+        <register type="FLEX" address="0x0000E658" value="0x00005004" />
+        <register type="FLEX" address="0x0000E758" value="0x00011010" />
+        <register type="FLEX" address="0x0000E45C" value="0x00050012" />
+        <register type="FLEX" address="0x0000E55C" value="0x00052051" />
+        <register type="FLEX" address="0x0000E65C" value="0x00000008" />
+    </register_config>
+  </set>
+
+  <set name="MDAPI testing set Gen9"
+       mdapi_supported_apis="VK OGL OCL IO BB"
+       underscore_name="test_oa"
+       hw_config_guid="dd3fd789-e783-4204-8cd0-b671bbccb0cf"
+       chipset="GLK"
+       symbol_name="TestOa"
+       >
+    <counter name="TestCounter7"
+             description="HW test counter 7. Factor: 0.666"
+             data_type="uint64"
+             equation="B 7 READ"
+             underscore_name="counter7"
+             units="events"
+             symbol_name="Counter7"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="TestCounter8"
+             description="HW test counter 8. Should be equal to 1."
+             data_type="uint64"
+             equation="C 7 READ"
+             underscore_name="counter8"
+             units="events"
+             symbol_name="Counter8"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="TestCounter4"
+             description="HW test counter 4. Factor: 0.333"
+             data_type="uint64"
+             equation="B 4 READ"
+             underscore_name="counter4"
+             units="events"
+             symbol_name="Counter4"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="TestCounter5"
+             description="HW test counter 5. Factor: 0.333"
+             data_type="uint64"
+             equation="B 5 READ"
+             underscore_name="counter5"
+             units="events"
+             symbol_name="Counter5"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="TestCounter6"
+             description="HW test counter 6. Factor: 0.166"
+             data_type="uint64"
+             equation="B 6 READ"
+             underscore_name="counter6"
+             units="events"
+             symbol_name="Counter6"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="TestCounter3"
+             description="HW test counter 3. Factor: 0.5"
+             data_type="uint64"
+             equation="B 3 READ"
+             underscore_name="counter3"
+             units="events"
+             symbol_name="Counter3"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="TestCounter0"
+             description="HW test counter 0. Factor: 0.0"
+             data_type="uint64"
+             equation="B 0 READ"
+             underscore_name="counter0"
+             units="events"
+             symbol_name="Counter0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="TestCounter1"
+             description="HW test counter 1. Factor: 1.0"
+             data_type="uint64"
+             equation="B 1 READ"
+             underscore_name="counter1"
+             units="events"
+             symbol_name="Counter1"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="TestCounter2"
+             description="HW test counter 2. Factor: 1.0"
+             data_type="uint64"
+             equation="B 2 READ"
+             underscore_name="counter2"
+             units="events"
+             symbol_name="Counter2"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x19800000" />
+        <register type="NOA" address="0x00009888" value="0x07800063" />
+        <register type="NOA" address="0x00009888" value="0x11800000" />
+        <register type="NOA" address="0x00009888" value="0x23810008" />
+        <register type="NOA" address="0x00009888" value="0x1D950400" />
+        <register type="NOA" address="0x00009888" value="0x0F922000" />
+        <register type="NOA" address="0x00009888" value="0x1F908000" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x55900000" />
+        <register type="NOA" address="0x00009888" value="0x47900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002744" value="0x00800000" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002770" value="0x00000004" />
+        <register type="OA" address="0x00002774" value="0x00000000" />
+        <register type="OA" address="0x00002778" value="0x00000003" />
+        <register type="OA" address="0x0000277C" value="0x00000000" />
+        <register type="OA" address="0x00002780" value="0x00000007" />
+        <register type="OA" address="0x00002784" value="0x00000000" />
+        <register type="OA" address="0x00002788" value="0x00100002" />
+        <register type="OA" address="0x0000278C" value="0x0000FFF7" />
+        <register type="OA" address="0x00002790" value="0x00100002" />
+        <register type="OA" address="0x00002794" value="0x0000FFCF" />
+        <register type="OA" address="0x00002798" value="0x00100082" />
+        <register type="OA" address="0x0000279C" value="0x0000FFEF" />
+        <register type="OA" address="0x000027A0" value="0x001000C2" />
+        <register type="OA" address="0x000027A4" value="0x0000FFE7" />
+        <register type="OA" address="0x000027A8" value="0x00100001" />
+        <register type="OA" address="0x000027AC" value="0x0000FFE7" />
+    </register_config>
+  </set>
+
+  <set name="Metric set PMA Stall"
+       mdapi_supported_apis="VK OGL OGL4 OCL IO MEDIA"
+       underscore_name="pma__stall"
+       hw_config_guid="e6868953-fb47-431d-a060-f785916558fc"
+       chipset="GLK"
+       symbol_name="PMA_Stall"
+       >
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="STC PMA stall"
+             description="Percentage of time when stencil cache line and an overlapping pixel are causing stalls"
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ B 1 READ FADD 2 FDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="stc_pma_stall"
+             units="percent"
+             symbol_name="StcPMAStall"
+             availability="$SliceMask 1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_group="GPU/Stencil Cache"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x124C3080" />
+        <register type="NOA" address="0x00009888" value="0x002D1000" />
+        <register type="NOA" address="0x00009888" value="0x062D4000" />
+        <register type="NOA" address="0x00009888" value="0x082D5000" />
+        <register type="NOA" address="0x00009888" value="0x0A2D5000" />
+        <register type="NOA" address="0x00009888" value="0x0C2E0400" />
+        <register type="NOA" address="0x00009888" value="0x0E2E5500" />
+        <register type="NOA" address="0x00009888" value="0x102E0001" />
+        <register type="NOA" address="0x00009888" value="0x004C0045" />
+        <register type="NOA" address="0x00009888" value="0x064C2300" />
+        <register type="NOA" address="0x00009888" value="0x084C26C4" />
+        <register type="NOA" address="0x00009888" value="0x0A4C264E" />
+        <register type="NOA" address="0x00009888" value="0x164C0000" />
+        <register type="NOA" address="0x00009888" value="0x044C0000" />
+        <register type="NOA" address="0x00009888" value="0x0C4C0000" />
+        <register type="NOA" address="0x00009888" value="0x0E4C0000" />
+        <register type="NOA" address="0x00009888" value="0x01938000" />
+        <register type="NOA" address="0x00009888" value="0x0F938000" />
+        <register type="NOA" address="0x00009888" value="0x199300AA" />
+        <register type="NOA" address="0x00009888" value="0x13904000" />
+        <register type="NOA" address="0x00009888" value="0x21904000" />
+        <register type="NOA" address="0x00009888" value="0x23904000" />
+        <register type="NOA" address="0x00009888" value="0x25904000" />
+        <register type="NOA" address="0x00009888" value="0x27904000" />
+        <register type="NOA" address="0x00009888" value="0x29904000" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+        <register type="NOA" address="0x00009888" value="0x43900000" />
+        <register type="NOA" address="0x00009888" value="0x55900000" />
+        <register type="NOA" address="0x00009888" value="0x47900000" />
+        <register type="NOA" address="0x00009888" value="0x57900000" />
+        <register type="NOA" address="0x00009888" value="0x49900000" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x30800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+        <register type="OA" address="0x00002770" value="0x00E00021" />
+        <register type="OA" address="0x00002774" value="0x0007FFF8" />
+        <register type="OA" address="0x00002778" value="0x07000101" />
+        <register type="OA" address="0x0000277C" value="0x0038FFC7" />
+    </register_config>
+  </set>
+
+</metrics>
diff --git a/lib/i915/perf-configs/oa-hsw.xml b/lib/i915/perf-configs/oa-hsw.xml
new file mode 100644
index 00000000..a95c6f5a
--- /dev/null
+++ b/lib/i915/perf-configs/oa-hsw.xml
@@ -0,0 +1,4615 @@
+<?xml version="1.0"?>
+<metrics version="1562317146" merge_md5="">
+  <set name="Render Metrics Basic Gen7.5"
+       mdapi_supported_apis="OGL OCL IO BB"
+       underscore_name="render_basic"
+       hw_config_guid="a490e9d2-55b3-4db0-8dab-53011032c5f3"
+       chipset="HSW"
+       symbol_name="RenderBasic"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="C 2 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="TES EU Stall"
+             description="The percentage of time in which evaluation shaders were stalled on the EUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 13 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ds_eu_stall"
+             units="percent"
+             symbol_name="DsEuStall"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="EU Array/Evaluation Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="LLC GPU Accesses"
+             description="The total number of LLC cache lookups done from the GPU (64b reads, 32B writes)."
+             data_type="uint64"
+             equation="PERFCNT1 READ_REG"
+             underscore_name="llc_accesses"
+             units="messages"
+             symbol_name="LlcAccesses"
+             availability="true $QueryMode &&"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="LLC"
+             />
+    <counter name="Alpha Test Fails"
+             description="The total number of pixels dropped on post-FS alpha test."
+             data_type="uint64"
+             equation="A 37 READ"
+             underscore_name="alpha_test_fails"
+             units="pixels"
+             symbol_name="AlphaTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Sampler 1 Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which sampler 1 was a bottleneck."
+             data_type="float"
+             high_watermark="15"
+             equation="B 3 READ 100 UMUL $GpuCoreClocks FDIV"
+             max_equation="100"
+             underscore_name="sampler1_bottleneck"
+             units="percent"
+             symbol_name="Sampler1Bottleneck"
+             availability="$SubsliceMask 0x2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="TES Threads Dispatched"
+             description="The total number of evaluation shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 15 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Evaluation Shader"
+             />
+    <counter name="TES AVG Active per Thread"
+             description="The average number of cycles per hardware thread run in which evaluation shaders were processed actively on the EUs."
+             data_type="uint64"
+             max_equation="100"
+             equation="A 12 READ $DsThreads UDIV"
+             underscore_name="ds_eu_active_per_thread"
+             units="cycles"
+             symbol_name="DsEuActivePerThread"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="EU Array/Evaluation Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 25 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="GS EU Stall"
+             description="The percentage of time in which geometry shaders were stalled on the EUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 23 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gs_eu_stall"
+             units="percent"
+             symbol_name="GsEuStall"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="EU Array/Geometry Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="CS EU Active"
+             description="The percentage of time in which compute shaders were processed actively on the EUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="cs_eu_active"
+             units="percent"
+             symbol_name="CsEuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="EU Array/Compute Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS EU Active"
+             description="The percentage of time in which vertex shaders were processed actively on the EUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 2 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_eu_active"
+             units="percent"
+             symbol_name="VsEuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="TCS EU Active"
+             description="The percentage of time in which control shaders were processed actively on the EUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="hs_eu_active"
+             units="percent"
+             symbol_name="HsEuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="EU Array/Control Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="TES EU Active"
+             description="The percentage of time in which evaluation shaders were processed actively on the EUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ds_eu_active"
+             units="percent"
+             symbol_name="DsEuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="EU Array/Evaluation Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS EU Active"
+             description="The percentage of time in which geometry shaders were processed actively on the EUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 22 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gs_eu_active"
+             units="percent"
+             symbol_name="GsEuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="EU Array/Geometry Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="FS EU Active"
+             description="The percentage of time in which fragment shaders were processed actively on the EUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 27 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_active"
+             units="percent"
+             symbol_name="PsEuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="EU Array/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="CS EU Stall"
+             description="The percentage of time in which compute shaders were stalled on the EUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="cs_eu_stall"
+             units="percent"
+             symbol_name="CsEuStall"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="EU Array/Compute Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 1 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS EU Stall"
+             description="The percentage of time in which vertex shaders were stalled on the EUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 3 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_eu_stall"
+             units="percent"
+             symbol_name="VsEuStall"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="TCS EU Stall"
+             description="The percentage of time in which control shaders were stalled on the EUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="hs_eu_stall"
+             units="percent"
+             symbol_name="HsEuStall"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="EU Array/Control Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="FS EU Stall"
+             description="The percentage of time in which fragment shaders were stalled on the EUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 28 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_stall"
+             units="percent"
+             symbol_name="PsEuStall"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="EU Array/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="CS Duration"
+             description="Total Compute Shader GPU duration."
+             data_type="uint64"
+             equation="A 17 READ  A 0 READ UMUL  A 2 READ  A 7 READ UADD  A 12 READ UADD  A 17 READ UADD  A 22 READ UADD  A 27 READ UADD UDIV  A 18 READ  A 1 READ UMUL  A 3 READ  A 8 READ UADD  A 13 READ UADD  A 18 READ UADD  A 23 READ UADD  A 28 READ UADD UDIV UADD $GpuTime UMUL $GpuCoreClocks $EuCoresTotalCount UMUL 1000 UMUL UDIV"
+             underscore_name="cs_duration"
+             units="us"
+             symbol_name="CsDuration"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4 OCL"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 30 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Sampler 0 Busy"
+             description="The percentage of time in which sampler 0 was busy."
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler0_busy"
+             units="percent"
+             symbol_name="Sampler0Busy"
+             availability="$SubsliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_group="Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Sampler 1 Busy"
+             description="The percentage of time in which sampler 1 was busy."
+             data_type="float"
+             max_equation="100"
+             equation="B 1 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler1_busy"
+             units="percent"
+             symbol_name="Sampler1Busy"
+             availability="$SubsliceMask 0x2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_group="Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Samplers Busy"
+             description="The percentage of time in which samplers were busy."
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ  B 1 READ UADD $GpuCoreClocks FDIV 2 FDIV 100 FMUL"
+             underscore_name="samplers_busy"
+             units="percent"
+             symbol_name="SamplersBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="Sampler"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="TES Duration"
+             description="Total Evaluation Shader GPU duration."
+             data_type="uint64"
+             equation="A 12 READ  A 0 READ UMUL  A 2 READ  A 7 READ UADD  A 12 READ UADD  A 17 READ UADD  A 22 READ UADD  A 27 READ UADD UDIV  A 13 READ  A 1 READ UMUL  A 3 READ  A 8 READ UADD  A 13 READ UADD  A 18 READ UADD  A 23 READ UADD  A 28 READ UADD UDIV UADD $GpuTime UMUL $GpuCoreClocks $EuCoresTotalCount UMUL 1000 UMUL UDIV"
+             underscore_name="ds_duration"
+             units="us"
+             symbol_name="DsDuration"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Evaluation Shader"
+             />
+    <counter name="GTI Fixed Pipe Throughput"
+             description="The total number of GPU memory bytes transferred between 3D Pipeline (Command Dispatch, Input Assembly and Stream Output) and GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL"
+             equation="C 1 READ 64 UMUL"
+             underscore_name="gti_vf_throughput"
+             units="bytes"
+             symbol_name="GtiVfThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="GTI/3D Pipe"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GTI Read Throughput"
+             description="The total number of GPU memory bytes read from GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL"
+             equation="C 6 READ 128 UMUL"
+             underscore_name="gti_read_throughput"
+             units="bytes"
+             symbol_name="GtiReadThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 20 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="CS AVG Active per Thread"
+             description="The average number of cycles per hardware thread run in which compute shaders were processed actively on the EUs."
+             data_type="uint64"
+             max_equation="100"
+             equation="A 17 READ $CsThreads UDIV"
+             underscore_name="cs_eu_active_per_thread"
+             units="cycles"
+             symbol_name="CsEuActivePerThread"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="EU Array/Compute Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler 0 Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which sampler 0 was a bottleneck."
+             data_type="float"
+             high_watermark="15"
+             equation="B 2 READ 100 UMUL $GpuCoreClocks FDIV"
+             max_equation="100"
+             underscore_name="sampler0_bottleneck"
+             units="percent"
+             symbol_name="Sampler0Bottleneck"
+             availability="$SubsliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="GS AVG Stall per Thread"
+             description="The average number of cycles per hardware thread run in which geometry shaders were stalled on the EUs."
+             data_type="uint64"
+             equation="A 23 READ $GsThreads UDIV"
+             underscore_name="gs_eu_stall_per_thread"
+             units="cycles"
+             symbol_name="GsEuStallPerThread"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Sampler 0 Texels LOD0"
+             description="The total number of texel lookups in LOD0 in sampler 0 unit."
+             data_type="uint64"
+             equation="B 4 READ 4 UMUL"
+             underscore_name="sampler0_texels"
+             units="texels"
+             symbol_name="Sampler0Texels"
+             availability="$SubsliceMask 0x1 AND"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="Sampler"
+             />
+    <counter name="Sampler 1 Texels LOD0"
+             description="The total number of texel lookups in LOD0 in sampler 1 unit."
+             data_type="uint64"
+             equation="B 5 READ 4 UMUL"
+             underscore_name="sampler1_texels"
+             units="texels"
+             symbol_name="Sampler1Texels"
+             availability="$SubsliceMask 0x2 AND"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="Sampler"
+             />
+    <counter name="Sampler Texels LOD0"
+             description="The total number of texel lookups in LOD0 in all sampler units."
+             data_type="uint64"
+             equation="$Sampler0Texels $Sampler1Texels UADD $EuSlicesTotalCount UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler"
+             />
+    <counter name="GS Duration"
+             description="Total Geometry Shader GPU duration."
+             data_type="uint64"
+             equation="A 22 READ  A 0 READ UMUL  A 2 READ  A 7 READ UADD  A 12 READ UADD  A 17 READ UADD  A 22 READ UADD  A 27 READ UADD UDIV  A 23 READ  A 1 READ UMUL  A 3 READ  A 8 READ UADD  A 13 READ UADD  A 18 READ UADD  A 23 READ UADD  A 28 READ UADD UDIV UADD $GpuTime UMUL $GpuCoreClocks $EuCoresTotalCount UMUL 1000 UMUL UDIV"
+             underscore_name="gs_duration"
+             units="us"
+             symbol_name="GsDuration"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Idle"
+             description="The percentage of time in which the Execution Units were idle."
+             data_type="float"
+             max_equation="100"
+             equation="100 $EuActive $EuStall FADD FSUB"
+             underscore_name="eu_idle"
+             units="percent"
+             symbol_name="EuIdle"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GTI Depth Throughput"
+             description="The total number of GPU memory bytes transferred between depth caches and GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="C 0 READ 64 UMUL"
+             underscore_name="gti_depth_throughput"
+             units="bytes"
+             symbol_name="GtiDepthThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="GTI/Depth Cache"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GTI Write Throughput"
+             description="The total number of GPU memory bytes written to GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 32 UMUL"
+             equation="C 7 READ 64 UMUL"
+             underscore_name="gti_write_throughput"
+             units="bytes"
+             symbol_name="GtiWriteThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="FS AVG Stall per Thread"
+             description="The average number of cycles per hardware thread run in which fragment shaders were stalled on the EUs."
+             data_type="uint64"
+             equation="A 28 READ $PsThreads UDIV"
+             underscore_name="ps_eu_stall_per_thread"
+             units="cycles"
+             symbol_name="PsEuStallPerThread"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="GTI L3 Throughput"
+             description="The total number of GPU memory bytes transferred between L3 caches and GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="C 4 READ 64 UMUL"
+             underscore_name="gti_l3_throughput"
+             units="bytes"
+             symbol_name="GtiL3Throughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS AVG Stall per Thread"
+             description="The average number of cycles per hardware thread run in which vertex shaders were stalled on the EUs."
+             data_type="uint64"
+             equation="A 3 READ $VsThreads UDIV"
+             underscore_name="vs_eu_stall_per_thread"
+             units="cycles"
+             symbol_name="VsEuStallPerThread"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="C 5 READ $EuSlicesTotalCount 4 UMUL UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 41 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="FS AVG Active per Thread"
+             description="The average number of cycles per hardware thread run in which fragment shaders were processed actively on the EUs."
+             data_type="uint64"
+             max_equation="100"
+             equation="A 27 READ $PsThreads UDIV"
+             underscore_name="ps_eu_active_per_thread"
+             units="cycles"
+             symbol_name="PsEuActivePerThread"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="EU Array/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="TCS Duration"
+             description="Total Control Shader GPU duration."
+             data_type="uint64"
+             equation="A 7 READ  A 0 READ UMUL  A 2 READ  A 7 READ UADD  A 12 READ UADD  A 17 READ UADD  A 22 READ UADD  A 27 READ UADD UDIV  A 8 READ  A 1 READ UMUL  A 3 READ  A 8 READ UADD  A 13 READ UADD  A 18 READ UADD  A 23 READ UADD  A 28 READ UADD UDIV UADD $GpuTime UMUL $GpuCoreClocks $EuCoresTotalCount UMUL 1000 UMUL UDIV"
+             underscore_name="hs_duration"
+             units="us"
+             symbol_name="HsDuration"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4 OCL"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Control Shader"
+             />
+    <counter name="TES AVG Stall per Thread"
+             description="The average number of cycles per hardware thread run in which evaluation shaders were stalled on the EUs."
+             data_type="uint64"
+             equation="A 13 READ $DsThreads UDIV"
+             underscore_name="ds_eu_stall_per_thread"
+             units="cycles"
+             symbol_name="DsEuStallPerThread"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Evaluation Shader"
+             />
+    <counter name="GS AVG Active per Thread"
+             description="The average number of cycles per hardware thread run in which geometry shaders were processed actively on the EUs."
+             data_type="uint64"
+             max_equation="100"
+             equation="A 22 READ $GsThreads UDIV"
+             underscore_name="gs_eu_active_per_thread"
+             units="cycles"
+             symbol_name="GsEuActivePerThread"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="EU Array/Geometry Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="TCS Threads Dispatched"
+             description="The total number of control shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 10 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Control Shader"
+             />
+    <counter name="TCS AVG Stall per Thread"
+             description="The average number of cycles per hardware thread run in which control shaders were stalled on the EUs."
+             data_type="uint64"
+             equation="A 8 READ $HsThreads UDIV"
+             underscore_name="hs_eu_stall_per_thread"
+             units="cycles"
+             symbol_name="HsEuStallPerThread"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Control Shader"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 36 READ"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="Late Depth Test Fails"
+             description="The total number of pixels dropped on post-FS depth test."
+             data_type="uint64"
+             equation="A 39 READ $SamplesKilledInPs USUB"
+             underscore_name="post_ps_depth_test_fails"
+             units="pixels"
+             symbol_name="PostPsDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Sampler Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which samplers were bottlenecks."
+             data_type="float"
+             high_watermark="15"
+             equation="$Sampler0Bottleneck $Sampler1Bottleneck FMAX"
+             max_equation="100"
+             underscore_name="sampler_bottleneck"
+             units="percent"
+             symbol_name="SamplerBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Indicate System Frame Batch Draw"
+             mdapi_group="Sampler"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="TCS AVG Active per Thread"
+             description="The average number of cycles per hardware thread run in which control shaders were processed actively on the EUs."
+             data_type="uint64"
+             max_equation="100"
+             equation="A 7 READ $HsThreads UDIV"
+             underscore_name="hs_eu_active_per_thread"
+             units="cycles"
+             symbol_name="HsEuActivePerThread"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="EU Array/Control Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="FS Duration"
+             description="Total Fragment Shader GPU duration."
+             data_type="uint64"
+             equation="A 27 READ  A 0 READ UMUL  A 2 READ  A 7 READ UADD  A 12 READ UADD  A 17 READ UADD  A 22 READ UADD  A 27 READ UADD UDIV  A 28 READ  A 1 READ UMUL  A 3 READ  A 8 READ UADD  A 13 READ UADD  A 18 READ UADD  A 23 READ UADD  A 28 READ UADD UDIV UADD $GpuTime UMUL $GpuCoreClocks $EuCoresTotalCount UMUL 1000 UMUL UDIV"
+             underscore_name="ps_duration"
+             units="us"
+             symbol_name="PsDuration"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 33 READ"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="CS AVG Stall per Thread"
+             description="The average number of cycles per hardware thread run in which compute shaders were stalled on the EUs."
+             data_type="uint64"
+             equation="A 18 READ $CsThreads UDIV"
+             underscore_name="cs_eu_stall_per_thread"
+             units="cycles"
+             symbol_name="CsEuStallPerThread"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="LLC GPU Hits"
+             description="The total number of successful LLC cache lookups done from the GPU."
+             data_type="uint64"
+             equation="PERFCNT2 READ_REG"
+             underscore_name="llc_hits"
+             units="messages"
+             symbol_name="LlcHits"
+             availability="true $QueryMode &&"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="LLC"
+             />
+    <counter name="Late Stencil Test Fails"
+             description="The total number of pixels dropped on post-FS stencil test."
+             data_type="uint64"
+             equation="A 38 READ"
+             underscore_name="post_ps_stencil_test_fails"
+             units="pixels"
+             symbol_name="PostPsStencilTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="LLC GPU Throughput"
+             description="The total number of GPU memory bytes transferred between GPU and LLC."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL"
+             equation="PERFCNT1 READ_REG C 7 READ USUB 64 UMUL"
+             underscore_name="llc_gpu_throughput"
+             units="bytes"
+             symbol_name="LlcGpuThroughput"
+             availability="true $QueryMode &&"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="LLC"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GTI RCC Throughput"
+             description="The total number of GPU memory bytes transferred between render color caches and GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="C 3 READ 64 UMUL"
+             underscore_name="gti_rcc_throughput"
+             units="bytes"
+             symbol_name="GtiRccThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="GTI/Color Cache"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Sampler Throughput"
+             description="The total number of GPU memory bytes transferred between samplers and L3 caches."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="B 6 READ B 7 READ UADD 2 UMUL $EuSlicesTotalCount UMUL 64 UMUL"
+             underscore_name="l3_sampler_throughput"
+             units="bytes"
+             symbol_name="L3SamplerThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Sampler"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS AVG Active per Thread"
+             description="The average number of cycles per hardware thread run in which vertex shaders were processed actively on the EUs."
+             data_type="uint64"
+             max_equation="100"
+             equation="A 2 READ $VsThreads UDIV"
+             underscore_name="vs_eu_active_per_thread"
+             units="cycles"
+             symbol_name="VsEuActivePerThread"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Duration"
+             description="Total Vertex Shader GPU duration."
+             data_type="uint64"
+             equation="A 2 READ  A 0 READ UMUL  A 2 READ  A 7 READ UADD  A 12 READ UADD  A 17 READ UADD  A 22 READ UADD  A 27 READ UADD UDIV  A 3 READ  A 1 READ UMUL  A 3 READ  A 8 READ UADD  A 13 READ UADD  A 18 READ UADD  A 23 READ UADD  A 28 READ UADD UDIV UADD $GpuTime UMUL $GpuCoreClocks $EuCoresTotalCount UMUL 1000 UMUL UDIV"
+             underscore_name="vs_duration"
+             units="us"
+             symbol_name="VsDuration"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 40 READ"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x000253A4" value="0x01600000" />
+        <register type="NOA" address="0x00025440" value="0x00100000" />
+        <register type="NOA" address="0x00025128" value="0x00000000" />
+        <register type="NOA" address="0x0002691C" value="0x00000800" />
+        <register type="NOA" address="0x00026AA0" value="0x01500000" />
+        <register type="NOA" address="0x00026B9C" value="0x00006000" />
+        <register type="NOA" address="0x0002791C" value="0x00000800" />
+        <register type="NOA" address="0x00027AA0" value="0x01500000" />
+        <register type="NOA" address="0x00027B9C" value="0x00006000" />
+        <register type="NOA" address="0x0002641C" value="0x00000400" />
+        <register type="NOA" address="0x00025380" value="0x00000010" />
+        <register type="NOA" address="0x0002538C" value="0x00000000" />
+        <register type="NOA" address="0x00025384" value="0x0800AAAA" />
+        <register type="NOA" address="0x00025400" value="0x00000004" />
+        <register type="NOA" address="0x0002540C" value="0x06029000" />
+        <register type="NOA" address="0x00025410" value="0x00000002" />
+        <register type="NOA" address="0x00025404" value="0x5C30FFFF" />
+        <register type="NOA" address="0x00025100" value="0x00000016" />
+        <register type="NOA" address="0x00025110" value="0x00000400" />
+        <register type="NOA" address="0x00025104" value="0x00000000" />
+        <register type="NOA" address="0x00026804" value="0x00001211" />
+        <register type="NOA" address="0x00026884" value="0x00000100" />
+        <register type="NOA" address="0x00026900" value="0x00000002" />
+        <register type="NOA" address="0x00026908" value="0x00700000" />
+        <register type="NOA" address="0x00026904" value="0x00000000" />
+        <register type="NOA" address="0x00026984" value="0x00001022" />
+        <register type="NOA" address="0x00026A04" value="0x00000011" />
+        <register type="NOA" address="0x00026A80" value="0x00000006" />
+        <register type="NOA" address="0x00026A88" value="0x00000C02" />
+        <register type="NOA" address="0x00026A84" value="0x00000000" />
+        <register type="NOA" address="0x00026B04" value="0x00001000" />
+        <register type="NOA" address="0x00026B80" value="0x00000002" />
+        <register type="NOA" address="0x00026B8C" value="0x00000007" />
+        <register type="NOA" address="0x00026B84" value="0x00000000" />
+        <register type="NOA" address="0x00027804" value="0x00004844" />
+        <register type="NOA" address="0x00027884" value="0x00000400" />
+        <register type="NOA" address="0x00027900" value="0x00000002" />
+        <register type="NOA" address="0x00027908" value="0x0E000000" />
+        <register type="NOA" address="0x00027904" value="0x00000000" />
+        <register type="NOA" address="0x00027984" value="0x00004088" />
+        <register type="NOA" address="0x00027A04" value="0x00000044" />
+        <register type="NOA" address="0x00027A80" value="0x00000006" />
+        <register type="NOA" address="0x00027A88" value="0x00018040" />
+        <register type="NOA" address="0x00027A84" value="0x00000000" />
+        <register type="NOA" address="0x00027B04" value="0x00004000" />
+        <register type="NOA" address="0x00027B80" value="0x00000002" />
+        <register type="NOA" address="0x00027B8C" value="0x000000E0" />
+        <register type="NOA" address="0x00027B84" value="0x00000000" />
+        <register type="NOA" address="0x00026104" value="0x00002222" />
+        <register type="NOA" address="0x00026184" value="0x0C006666" />
+        <register type="NOA" address="0x00026284" value="0x04000000" />
+        <register type="NOA" address="0x00026304" value="0x04000000" />
+        <register type="NOA" address="0x00026400" value="0x00000002" />
+        <register type="NOA" address="0x00026410" value="0x000000A0" />
+        <register type="NOA" address="0x00026404" value="0x00000000" />
+        <register type="NOA" address="0x00025420" value="0x04108020" />
+        <register type="NOA" address="0x00025424" value="0x1284A420" />
+        <register type="NOA" address="0x0002541C" value="0x00000000" />
+        <register type="NOA" address="0x00025428" value="0x00042049" />
+        <register type="NOA" address="0x000091BC" value="0xE0400000" />
+        <register type="NOA" address="0x000091C4" value="0xE4500000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002724" value="0x00800000" /> <!--OASTARTTRIG6 -->
+        <register type="OA" address="0x00002720" value="0x00000000" /> <!--OASTARTTRIG5 -->
+        <register type="OA" address="0x00002714" value="0x00800000" /> <!--OASTARTTRIG2 -->
+        <register type="OA" address="0x00002710" value="0x00000000" /> <!--OASTARTTRIG1 -->
+    </register_config>
+  </set>
+
+  <set name="Compute Metrics Basic Gen7.5"
+       mdapi_supported_apis="OGL4 OCL IO BB"
+       underscore_name="compute_basic"
+       hw_config_guid="b344c8cb-a291-4cbf-aa9c-b40213bfc96f"
+       chipset="HSW"
+       symbol_name="ComputeBasic"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="C 2 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="TES EU Stall"
+             description="The percentage of time in which evaluation shaders were stalled on the EUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 13 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ds_eu_stall"
+             units="percent"
+             symbol_name="DsEuStall"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="EU Array/Evaluation Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="LLC GPU Accesses"
+             description="The total number of LLC cache lookups done from the GPU (64b reads, 32B writes)."
+             data_type="uint64"
+             equation="PERFCNT1 READ_REG"
+             underscore_name="llc_accesses"
+             units="messages"
+             symbol_name="LlcAccesses"
+             availability="true $QueryMode &amp;&amp;"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="LLC"
+             />
+    <counter name="Typed Bytes Written"
+             description="The total number of typed memory bytes written via Data Port."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="B 6 READ B 7 READ UADD $EuSlicesTotalCount 64 UMUL UMUL"
+             underscore_name="typed_bytes_written"
+             units="bytes"
+             symbol_name="TypedBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Alpha Test Fails"
+             description="The total number of pixels dropped on post-FS alpha test."
+             data_type="uint64"
+             equation="A 37 READ"
+             underscore_name="alpha_test_fails"
+             units="pixels"
+             symbol_name="AlphaTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="TCS Threads Dispatched"
+             description="The total number of control shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 10 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Control Shader"
+             />
+    <counter name="TCS AVG Active per Thread"
+             description="The average number of cycles per hardware thread run in which control shaders were processed actively on the EUs."
+             data_type="uint64"
+             max_equation="100"
+             equation="A 7 READ $HsThreads UDIV"
+             underscore_name="hs_eu_active_per_thread"
+             units="cycles"
+             symbol_name="HsEuActivePerThread"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="EU Array/Control Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 25 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="GS EU Stall"
+             description="The percentage of time in which geometry shaders were stalled on the EUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 23 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gs_eu_stall"
+             units="percent"
+             symbol_name="GsEuStall"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="EU Array/Geometry Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 30 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 20 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="CS AVG Active per Thread"
+             description="The average number of cycles per hardware thread run in which compute shaders were processed actively on the EUs."
+             data_type="uint64"
+             max_equation="100"
+             equation="A 17 READ $CsThreads UDIV"
+             underscore_name="cs_eu_active_per_thread"
+             units="cycles"
+             symbol_name="CsEuActivePerThread"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="EU Array/Compute Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Untyped Bytes Read"
+             description="The total number of untyped memory bytes read via Data Port."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="B 0 READ B 1 READ UADD $EuSlicesTotalCount 64 UMUL UMUL"
+             underscore_name="untyped_bytes_read"
+             units="bytes"
+             symbol_name="UntypedBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS AVG Stall per Thread"
+             description="The average number of cycles per hardware thread run in which geometry shaders were stalled on the EUs."
+             data_type="uint64"
+             equation="A 23 READ $GsThreads UDIV"
+             underscore_name="gs_eu_stall_per_thread"
+             units="cycles"
+             symbol_name="GsEuStallPerThread"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Typed Atomics"
+             description="The total number of typed atomics."
+             data_type="uint64"
+             equation="C 0 READ C 1 READ UADD $EuSlicesTotalCount UMUL"
+             underscore_name="typed_atomics"
+             units="messages"
+             symbol_name="TypedAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="C 6 READ C 7 READ UADD $EuSlicesTotalCount 64 UMUL UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="FS AVG Stall per Thread"
+             description="The average number of cycles per hardware thread run in which fragment shaders were stalled on the EUs."
+             data_type="uint64"
+             equation="A 28 READ $PsThreads UDIV"
+             underscore_name="ps_eu_stall_per_thread"
+             units="cycles"
+             symbol_name="PsEuStallPerThread"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="TES EU Active"
+             description="The percentage of time in which evaluation shaders were processed actively on the EUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ds_eu_active"
+             units="percent"
+             symbol_name="DsEuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="EU Array/Evaluation Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS AVG Stall per Thread"
+             description="The average number of cycles per hardware thread run in which vertex shaders were stalled on the EUs."
+             data_type="uint64"
+             equation="A 3 READ $VsThreads UDIV"
+             underscore_name="vs_eu_stall_per_thread"
+             units="cycles"
+             symbol_name="VsEuStallPerThread"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="TCS EU Stall"
+             description="The percentage of time in which control shaders were stalled on the EUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="hs_eu_stall"
+             units="percent"
+             symbol_name="HsEuStall"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="EU Array/Control Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 41 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="FS AVG Active per Thread"
+             description="The average number of cycles per hardware thread run in which fragment shaders were processed actively on the EUs."
+             data_type="uint64"
+             max_equation="100"
+             equation="A 27 READ $PsThreads UDIV"
+             underscore_name="ps_eu_active_per_thread"
+             units="cycles"
+             symbol_name="PsEuActivePerThread"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="EU Array/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="TES Threads Dispatched"
+             description="The total number of evaluation shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 15 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Evaluation Shader"
+             />
+    <counter name="TES AVG Active per Thread"
+             description="The average number of cycles per hardware thread run in which evaluation shaders were processed actively on the EUs."
+             data_type="uint64"
+             max_equation="100"
+             equation="A 12 READ $DsThreads UDIV"
+             underscore_name="ds_eu_active_per_thread"
+             units="cycles"
+             symbol_name="DsEuActivePerThread"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="EU Array/Evaluation Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS EU Active"
+             description="The percentage of time in which geometry shaders were processed actively on the EUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 22 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gs_eu_active"
+             units="percent"
+             symbol_name="GsEuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="EU Array/Geometry Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="FS EU Active"
+             description="The percentage of time in which fragment shaders were processed actively on the EUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 27 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_active"
+             units="percent"
+             symbol_name="PsEuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="EU Array/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="TES AVG Stall per Thread"
+             description="The average number of cycles per hardware thread run in which evaluation shaders were stalled on the EUs."
+             data_type="uint64"
+             equation="A 13 READ $DsThreads UDIV"
+             underscore_name="ds_eu_stall_per_thread"
+             units="cycles"
+             symbol_name="DsEuStallPerThread"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Evaluation Shader"
+             />
+    <counter name="GS AVG Active per Thread"
+             description="The average number of cycles per hardware thread run in which geometry shaders were processed actively on the EUs."
+             data_type="uint64"
+             max_equation="100"
+             equation="A 22 READ $GsThreads UDIV"
+             underscore_name="gs_eu_active_per_thread"
+             units="cycles"
+             symbol_name="GsEuActivePerThread"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="EU Array/Geometry Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Untyped Writes"
+             description="The total number of untyped memory bytes written via Data Port."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="B 2 READ B 3 READ UADD $EuSlicesTotalCount 64 UMUL UMUL"
+             underscore_name="untyped_bytes_written"
+             units="bytes"
+             symbol_name="UntypedBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="C 4 READ C 5 READ UADD $EuSlicesTotalCount 64 UMUL UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="TCS AVG Stall per Thread"
+             description="The average number of cycles per hardware thread run in which control shaders were stalled on the EUs."
+             data_type="uint64"
+             equation="A 8 READ $HsThreads UDIV"
+             underscore_name="hs_eu_stall_per_thread"
+             units="cycles"
+             symbol_name="HsEuStallPerThread"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Control Shader"
+             />
+    <counter name="TCS EU Active"
+             description="The percentage of time in which control shaders were processed actively on the EUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="hs_eu_active"
+             units="percent"
+             symbol_name="HsEuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="EU Array/Control Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 36 READ"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="Late Depth Test Fails"
+             description="The total number of pixels dropped on post-FS depth test."
+             data_type="uint64"
+             equation="A 39 READ $SamplesKilledInPs USUB"
+             underscore_name="post_ps_depth_test_fails"
+             units="pixels"
+             symbol_name="PostPsDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="FS EU Stall"
+             description="The percentage of time in which fragment shaders were stalled on the EUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 28 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_stall"
+             units="percent"
+             symbol_name="PsEuStall"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="EU Array/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 1 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 33 READ"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="VS EU Active"
+             description="The percentage of time in which vertex shaders were processed actively on the EUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 2 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_eu_active"
+             units="percent"
+             symbol_name="VsEuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="CS EU Active"
+             description="The percentage of time in which compute shaders were processed actively on the EUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="cs_eu_active"
+             units="percent"
+             symbol_name="CsEuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="EU Array/Compute Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="CS AVG Stall per Thread"
+             description="The average number of cycles per hardware thread run in which compute shaders were stalled on the EUs."
+             data_type="uint64"
+             equation="A 18 READ $CsThreads UDIV"
+             underscore_name="cs_eu_stall_per_thread"
+             units="cycles"
+             symbol_name="CsEuStallPerThread"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="LLC GPU Hits"
+             description="The total number of successful LLC cache lookups done from the GPU."
+             data_type="uint64"
+             equation="PERFCNT2 READ_REG"
+             underscore_name="llc_hits"
+             units="messages"
+             symbol_name="LlcHits"
+             availability="true $QueryMode &&"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="LLC"
+             />
+    <counter name="Late Stencil Test Fails"
+             description="The total number of pixels dropped on post-FS stencil test."
+             data_type="uint64"
+             equation="A 38 READ"
+             underscore_name="post_ps_stencil_test_fails"
+             units="pixels"
+             symbol_name="PostPsStencilTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="VS AVG Active per Thread"
+             description="The average number of cycles per hardware thread run in which vertex shaders were processed actively on the EUs."
+             data_type="uint64"
+             max_equation="100"
+             equation="A 2 READ $VsThreads UDIV"
+             underscore_name="vs_eu_active_per_thread"
+             units="cycles"
+             symbol_name="VsEuActivePerThread"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="CS EU Stall"
+             description="The percentage of time in which compute shaders were stalled on the EUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="cs_eu_stall"
+             units="percent"
+             symbol_name="CsEuStall"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="EU Array/Compute Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Typed Bytes Read"
+             description="The total number of typed memory bytes read via Data Port."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="B 4 READ B 5 READ UADD $EuSlicesTotalCount 64 UMUL UMUL"
+             underscore_name="typed_bytes_read"
+             units="bytes"
+             symbol_name="TypedBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 40 READ"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="VS EU Stall"
+             description="The percentage of time in which vertex shaders were stalled on the EUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 3 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_eu_stall"
+             units="percent"
+             symbol_name="VsEuStall"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x000253A4" value="0x00000000" />
+        <register type="NOA" address="0x0002681C" value="0x01F00800" />
+        <register type="NOA" address="0x00026820" value="0x00001000" />
+        <register type="NOA" address="0x0002781C" value="0x01F00800" />
+        <register type="NOA" address="0x00026520" value="0x00000007" />
+        <register type="NOA" address="0x000265A0" value="0x00000007" />
+        <register type="NOA" address="0x00025380" value="0x00000010" />
+        <register type="NOA" address="0x0002538C" value="0x00300000" />
+        <register type="NOA" address="0x00025384" value="0xAA8AAAAA" />
+        <register type="NOA" address="0x00025404" value="0xFFFFFFFF" />
+        <register type="NOA" address="0x00026800" value="0x00004202" />
+        <register type="NOA" address="0x00026808" value="0x00605817" />
+        <register type="NOA" address="0x0002680C" value="0x10001005" />
+        <register type="NOA" address="0x00026804" value="0x00000000" />
+        <register type="NOA" address="0x00027800" value="0x00000102" />
+        <register type="NOA" address="0x00027808" value="0x0C0701E0" />
+        <register type="NOA" address="0x0002780C" value="0x000200A0" />
+        <register type="NOA" address="0x00027804" value="0x00000000" />
+        <register type="NOA" address="0x00026484" value="0x44000000" />
+        <register type="NOA" address="0x00026704" value="0x44000000" />
+        <register type="NOA" address="0x00026500" value="0x00000006" />
+        <register type="NOA" address="0x00026510" value="0x00000001" />
+        <register type="NOA" address="0x00026504" value="0x88000000" />
+        <register type="NOA" address="0x00026580" value="0x00000006" />
+        <register type="NOA" address="0x00026590" value="0x00000020" />
+        <register type="NOA" address="0x00026584" value="0x00000000" />
+        <register type="NOA" address="0x00026104" value="0x55822222" />
+        <register type="NOA" address="0x00026184" value="0xAA866666" />
+        <register type="NOA" address="0x00025420" value="0x08320C83" />
+        <register type="NOA" address="0x00025424" value="0x06820C83" />
+        <register type="NOA" address="0x0002541C" value="0x00000000" />
+        <register type="NOA" address="0x00025428" value="0x00000C03" />
+        <register type="NOA" address="0x000091BC" value="0xE0400000" />
+        <register type="NOA" address="0x000091C4" value="0xE4500000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002710" value="0x00000000" /> <!--OASTARTTRIG1 -->
+        <register type="OA" address="0x00002714" value="0x00800000" /> <!--OASTARTTRIG2 -->
+        <register type="OA" address="0x00002718" value="0xAAAAAAAA" /> <!--OASTARTTRIG3 -->
+        <register type="OA" address="0x0000271C" value="0xAAAAAAAA" /> <!--OASTARTTRIG4 -->
+        <register type="OA" address="0x00002720" value="0x00000000" /> <!--OASTARTTRIG5 -->
+        <register type="OA" address="0x00002724" value="0x00800000" /> <!--OASTARTTRIG6 -->
+        <register type="OA" address="0x00002728" value="0xAAAAAAAA" /> <!--OASTARTTRIG7 -->
+        <register type="OA" address="0x0000272C" value="0xAAAAAAAA" /> <!--OASTARTTRIG8 -->
+        <register type="OA" address="0x00002740" value="0x00000000" /> <!--OAREPORTTRIG1 -->
+        <register type="OA" address="0x00002744" value="0x00000000" /> <!--OAREPORTTRIG2 -->
+        <register type="OA" address="0x00002748" value="0x00000000" /> <!--OAREPORTTRIG3 -->
+        <register type="OA" address="0x0000274C" value="0x00000000" /> <!--OAREPORTTRIG4 -->
+        <register type="OA" address="0x00002750" value="0x00000000" /> <!--OAREPORTTRIG5 -->
+        <register type="OA" address="0x00002754" value="0x00000000" /> <!--OAREPORTTRIG6 -->
+        <register type="OA" address="0x00002758" value="0x00000000" /> <!--OAREPORTTRIG7 -->
+        <register type="OA" address="0x0000275C" value="0x00000000" /> <!--OAREPORTTRIG8 -->
+    </register_config>
+  </set>
+
+  <set name="Compute Metrics Extended Gen7.5"
+       mdapi_supported_apis="OGL4 OCL IO BB"
+       underscore_name="compute_extended"
+       hw_config_guid="480f9795-cf6a-4204-a9e3-cd7015515f8d"
+       chipset="HSW"
+       symbol_name="ComputeExtended"
+       >
+    <counter name="EuUntypedWrites0"
+             description="The subslice 0 EU Untyped Writes subslice 0."
+             data_type="uint64"
+             equation="B 1 READ"
+             underscore_name="eu_untyped_writes0"
+             units="messages"
+             symbol_name="EuUntypedWrites0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="Untyped Writes 0"
+             description="The subslice 0 untyped writes (including SLM writes)."
+             data_type="uint64"
+             equation="C 1 READ"
+             underscore_name="untyped_writes0"
+             units="messages"
+             symbol_name="UntypedWrites0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="UntypedWritesPerCacheLine"
+             description="The ratio of EU untyped write requests to L3 cache line writes."
+             data_type="float"
+             equation="$EuUntypedWrites0 $UntypedWrites0 FDIV"
+             underscore_name="untyped_writes_per_cache_line"
+             units="eu sends to l3 cache lines"
+             symbol_name="UntypedWritesPerCacheLine"
+             semantic_type="ratio"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="LLC GPU Accesses"
+             description="The total number of LLC cache lookups done from the GPU (64b reads, 32B writes)."
+             data_type="uint64"
+             equation="PERFCNT1 READ_REG"
+             underscore_name="llc_accesses"
+             units="messages"
+             symbol_name="LlcAccesses"
+             availability="true $QueryMode &&"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="LLC"
+             />
+    <counter name="Typed Reads 0"
+             description="The subslice 0 typed reads."
+             data_type="uint64"
+             equation="C 2 READ"
+             underscore_name="typed_reads0"
+             units="messages"
+             symbol_name="TypedReads0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="Typed Writes 0"
+             description="The subslice 0 typed writes."
+             data_type="uint64"
+             equation="C 0 READ"
+             underscore_name="typed_writes0"
+             units="messages"
+             symbol_name="TypedWrites0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="EuTypedAtomics0"
+             description="The subslice 0 EU Typed Atomics subslice 0."
+             data_type="uint64"
+             equation="B 5 READ"
+             underscore_name="eu_typed_atomics0"
+             units="messages"
+             symbol_name="EuTypedAtomics0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="Typed Atomics 0"
+             description="The subslice 0 typed atomics."
+             data_type="uint64"
+             equation="C 4 READ"
+             underscore_name="typed_atomics0"
+             units="messages"
+             symbol_name="TypedAtomics0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="TypedAtomicsPerCacheLine"
+             description="The ratio of EU typed atomics requests to L3 cache line writes."
+             data_type="float"
+             equation="$EuTypedAtomics0 $TypedAtomics0 FDIV"
+             underscore_name="typed_atomics_per_cache_line"
+             units="eu sends to l3 cache lines"
+             symbol_name="TypedAtomicsPerCacheLine"
+             semantic_type="ratio"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="EuUntypedReads0"
+             description="The subslice 0 EU Untyped Reads subslice 0."
+             data_type="uint64"
+             equation="B 0 READ"
+             underscore_name="eu_untyped_reads0"
+             units="messages"
+             symbol_name="EuUntypedReads0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="EuUntypedAtomics0"
+             description="The subslice 0 EU Untyped Atomics subslice 0."
+             data_type="uint64"
+             equation="B 4 READ"
+             underscore_name="eu_untyped_atomics0"
+             units="messages"
+             symbol_name="EuUntypedAtomics0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="B 7 READ"
+             underscore_name="gpu_clocks"
+             units="cycles"
+             symbol_name="GpuClocks"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 20 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="EuTypedWrites0"
+             description="The subslice 0 EU Typed Writes subslice 0."
+             data_type="uint64"
+             equation="B 3 READ"
+             underscore_name="eu_typed_writes0"
+             units="messages"
+             symbol_name="EuTypedWrites0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="TypedWritesPerCacheLine"
+             description="The ratio of EU typed write requests to L3 cache line writes."
+             data_type="float"
+             equation="$EuTypedWrites0 $TypedWrites0 FDIV"
+             underscore_name="typed_writes_per_cache_line"
+             units="eu sends to l3 cache lines"
+             symbol_name="TypedWritesPerCacheLine"
+             semantic_type="ratio"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="LLC GPU Hits"
+             description="The total number of successful LLC cache lookups done from the GPU."
+             data_type="uint64"
+             equation="PERFCNT2 READ_REG"
+             underscore_name="llc_hits"
+             units="messages"
+             symbol_name="LlcHits"
+             availability="true $QueryMode &&"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="LLC"
+             />
+    <counter name="EuTypedReads0"
+             description="The subslice 0 EU Typed Reads subslice 0."
+             data_type="uint64"
+             equation="B 2 READ"
+             underscore_name="eu_typed_reads0"
+             units="messages"
+             symbol_name="EuTypedReads0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="EuUrbAtomics0"
+             description="The subslice 0 EU URB Atomics subslice 0."
+             data_type="uint64"
+             equation="B 6 READ"
+             underscore_name="eu_urb_atomics0"
+             units="messages"
+             symbol_name="EuUrbAtomics0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="Untyped Reads 0"
+             description="The subslice 0 untyped reads (including SLM reads)."
+             data_type="uint64"
+             equation="C 3 READ"
+             underscore_name="untyped_reads0"
+             units="messages"
+             symbol_name="UntypedReads0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="UntypedReadsPerCacheLine"
+             description="The ratio of EU untyped read requests to L3 cache line reads."
+             data_type="float"
+             equation="$EuUntypedReads0 $UntypedReads0 FDIV"
+             underscore_name="untyped_reads_per_cache_line"
+             units="eu sends to l3 cache lines"
+             symbol_name="UntypedReadsPerCacheLine"
+             semantic_type="ratio"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="TypedReadsPerCacheLine"
+             description="The ratio of EU typed read requests to L3 cache line reads."
+             data_type="float"
+             equation="$EuTypedReads0 $TypedReads0 FDIV"
+             underscore_name="typed_reads_per_cache_line"
+             units="eu sends to l3 cache lines"
+             symbol_name="TypedReadsPerCacheLine"
+             semantic_type="ratio"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x0002681C" value="0x3EB00800" />
+        <register type="NOA" address="0x00026820" value="0x00900000" />
+        <register type="NOA" address="0x00025384" value="0x02AAAAAA" />
+        <register type="NOA" address="0x00025404" value="0x03FFFFFF" />
+        <register type="NOA" address="0x00026800" value="0x00142284" />
+        <register type="NOA" address="0x00026808" value="0x0E629062" />
+        <register type="NOA" address="0x0002680C" value="0x3F6F55CB" />
+        <register type="NOA" address="0x00026810" value="0x00000014" />
+        <register type="NOA" address="0x00026804" value="0x00000000" />
+        <register type="NOA" address="0x00026104" value="0x02AAAAAA" />
+        <register type="NOA" address="0x00026184" value="0x02AAAAAA" />
+        <register type="NOA" address="0x00025420" value="0x00000000" />
+        <register type="NOA" address="0x00025424" value="0x00000000" />
+        <register type="NOA" address="0x0002541C" value="0x00000000" />
+        <register type="NOA" address="0x00025428" value="0x00000000" />
+        <register type="NOA" address="0x000091BC" value="0xE0400000" />
+        <register type="NOA" address="0x000091C4" value="0xE4500000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002724" value="0xF0800000" /> <!--OASTARTTRIG6 -->
+        <register type="OA" address="0x00002720" value="0x00000000" /> <!--OASTARTTRIG5 -->
+        <register type="OA" address="0x00002714" value="0xF0800000" /> <!--OASTARTTRIG2 -->
+        <register type="OA" address="0x00002710" value="0x00000000" /> <!--OASTARTTRIG1 -->
+        <register type="OA" address="0x00002770" value="0x0007FE2A" /> <!--OACEC0_0 -->
+        <register type="OA" address="0x00002774" value="0x0000FF00" /> <!--OACEC0_1 -->
+        <register type="OA" address="0x00002778" value="0x0007FE6A" /> <!--OACEC1_0 -->
+        <register type="OA" address="0x0000277C" value="0x0000FF00" /> <!--OACEC1_1 -->
+        <register type="OA" address="0x00002780" value="0x0007FE92" /> <!--OACEC2_0 -->
+        <register type="OA" address="0x00002784" value="0x0000FF00" /> <!--OACEC2_1 -->
+        <register type="OA" address="0x00002788" value="0x0007FEA2" /> <!--OACEC3_0 -->
+        <register type="OA" address="0x0000278C" value="0x0000FF00" /> <!--OACEC3_1 -->
+        <register type="OA" address="0x00002790" value="0x0007FE32" /> <!--OACEC4_0 -->
+        <register type="OA" address="0x00002794" value="0x0000FF00" /> <!--OACEC4_1 -->
+        <register type="OA" address="0x00002798" value="0x0007FE9A" /> <!--OACEC5_0 -->
+        <register type="OA" address="0x0000279C" value="0x0000FF00" /> <!--OACEC5_1 -->
+        <register type="OA" address="0x000027A0" value="0x0007FF23" /> <!--OACEC6_0 -->
+        <register type="OA" address="0x000027A4" value="0x0000FF00" /> <!--OACEC6_1 -->
+        <register type="OA" address="0x000027A8" value="0x0007FFF3" /> <!--OACEC7_0 -->
+        <register type="OA" address="0x000027AC" value="0x0000FFFE" /> <!--OACEC7_1 -->
+    </register_config>
+  </set>
+
+  <set name="Memory Reads Distribution Gen7.5"
+       mdapi_supported_apis="OGL OCL IO BB"
+       underscore_name="memory_reads"
+       hw_config_guid="399d3001-97d6-4240-b065-4fb843138e17"
+       chipset="HSW"
+       symbol_name="MemoryReads"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="C 7 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="TES EU Stall"
+             description="The percentage of time in which evaluation shaders were stalled on the EUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 13 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ds_eu_stall"
+             units="percent"
+             symbol_name="DsEuStall"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="EU Array/Evaluation Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="LLC GPU Accesses"
+             description="The total number of LLC cache lookups done from the GPU (64b reads, 32B writes)."
+             data_type="uint64"
+             equation="PERFCNT1 READ_REG"
+             underscore_name="llc_accesses"
+             units="messages"
+             symbol_name="LlcAccesses"
+             availability="true $QueryMode &&"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="LLC"
+             />
+    <counter name="Alpha Test Fails"
+             description="The total number of pixels dropped on post-FS alpha test."
+             data_type="uint64"
+             equation="A 37 READ"
+             underscore_name="alpha_test_fails"
+             units="pixels"
+             symbol_name="AlphaTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="TES Threads Dispatched"
+             description="The total number of evaluation shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 15 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Evaluation Shader"
+             />
+    <counter name="TES AVG Active per Thread"
+             description="The average number of cycles per hardware thread run in which evaluation shaders were processed actively on the EUs."
+             data_type="uint64"
+             max_equation="100"
+             equation="A 12 READ $DsThreads UDIV"
+             underscore_name="ds_eu_active_per_thread"
+             units="cycles"
+             symbol_name="DsEuActivePerThread"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="EU Array/Evaluation Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 25 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="GS EU Stall"
+             description="The percentage of time in which geometry shaders were stalled on the EUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 23 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gs_eu_stall"
+             units="percent"
+             symbol_name="GsEuStall"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="EU Array/Geometry Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="LLC GPU Read Accesses"
+             description="The total number of LLC cache lookups for reads done from the GPU."
+             data_type="uint64"
+             equation="C 6 READ"
+             underscore_name="llc_read_accesses"
+             units="messages"
+             symbol_name="LlcReadAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="LLC"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 30 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="GtiMemoryReads"
+             description="The total number of GTI memory reads (64B each)."
+             data_type="uint64"
+             equation="C 5 READ"
+             underscore_name="gti_memory_reads"
+             units="messages"
+             symbol_name="GtiMemoryReads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 20 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="CS AVG Active per Thread"
+             description="The average number of cycles per hardware thread run in which compute shaders were processed actively on the EUs."
+             data_type="uint64"
+             max_equation="100"
+             equation="A 17 READ $CsThreads UDIV"
+             underscore_name="cs_eu_active_per_thread"
+             units="cycles"
+             symbol_name="CsEuActivePerThread"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="EU Array/Compute Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GtiRczMemoryReads"
+             description="The total number of GTI memory reads from Render Depth Cache."
+             data_type="uint64"
+             equation="B 7 READ"
+             underscore_name="gti_rcz_memory_reads"
+             units="messages"
+             symbol_name="GtiRczMemoryReads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Depth Cache"
+             />
+    <counter name="GS AVG Stall per Thread"
+             description="The average number of cycles per hardware thread run in which geometry shaders were stalled on the EUs."
+             data_type="uint64"
+             equation="A 23 READ $GsThreads UDIV"
+             underscore_name="gs_eu_stall_per_thread"
+             units="cycles"
+             symbol_name="GsEuStallPerThread"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GtiRccMemoryReads"
+             description="The total number of GTI memory reads from Render Color Cache (Render Color Cache misses)."
+             data_type="uint64"
+             equation="B 3 READ"
+             underscore_name="gti_rcc_memory_reads"
+             units="messages"
+             symbol_name="GtiRccMemoryReads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Color Cache"
+             />
+    <counter name="FS AVG Stall per Thread"
+             description="The average number of cycles per hardware thread run in which fragment shaders were stalled on the EUs."
+             data_type="uint64"
+             equation="A 28 READ $PsThreads UDIV"
+             underscore_name="ps_eu_stall_per_thread"
+             units="cycles"
+             symbol_name="PsEuStallPerThread"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="TES EU Active"
+             description="The percentage of time in which evaluation shaders were processed actively on the EUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ds_eu_active"
+             units="percent"
+             symbol_name="DsEuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="EU Array/Evaluation Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS AVG Stall per Thread"
+             description="The average number of cycles per hardware thread run in which vertex shaders were stalled on the EUs."
+             data_type="uint64"
+             equation="A 3 READ $VsThreads UDIV"
+             underscore_name="vs_eu_stall_per_thread"
+             units="cycles"
+             symbol_name="VsEuStallPerThread"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="TCS EU Stall"
+             description="The percentage of time in which control shaders were stalled on the EUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="hs_eu_stall"
+             units="percent"
+             symbol_name="HsEuStall"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="EU Array/Control Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 41 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="FS AVG Active per Thread"
+             description="The average number of cycles per hardware thread run in which fragment shaders were processed actively on the EUs."
+             data_type="uint64"
+             max_equation="100"
+             equation="A 27 READ $PsThreads UDIV"
+             underscore_name="ps_eu_active_per_thread"
+             units="cycles"
+             symbol_name="PsEuActivePerThread"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="EU Array/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GtiCmdStreamerMemoryReads"
+             description="The total number of GTI memory reads from Command Streamer."
+             data_type="uint64"
+             equation="B 0 READ"
+             underscore_name="gti_cmd_streamer_memory_reads"
+             units="messages"
+             symbol_name="GtiCmdStreamerMemoryReads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/3D Pipe/Command Streamer"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="GS EU Active"
+             description="The percentage of time in which geometry shaders were processed actively on the EUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 22 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gs_eu_active"
+             units="percent"
+             symbol_name="GsEuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="EU Array/Geometry Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="FS EU Active"
+             description="The percentage of time in which fragment shaders were processed actively on the EUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 27 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_active"
+             units="percent"
+             symbol_name="PsEuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="EU Array/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="TES AVG Stall per Thread"
+             description="The average number of cycles per hardware thread run in which evaluation shaders were stalled on the EUs."
+             data_type="uint64"
+             equation="A 13 READ $DsThreads UDIV"
+             underscore_name="ds_eu_stall_per_thread"
+             units="cycles"
+             symbol_name="DsEuStallPerThread"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Evaluation Shader"
+             />
+    <counter name="GS AVG Active per Thread"
+             description="The average number of cycles per hardware thread run in which geometry shaders were processed actively on the EUs."
+             data_type="uint64"
+             max_equation="100"
+             equation="A 22 READ $GsThreads UDIV"
+             underscore_name="gs_eu_active_per_thread"
+             units="cycles"
+             symbol_name="GsEuActivePerThread"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="EU Array/Geometry Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GtiHiDepthMemoryReads"
+             description="The total number of GTI memory reads from Hierarchical Depth Cache."
+             data_type="uint64"
+             equation="B 5 READ"
+             underscore_name="gti_hi_depth_memory_reads"
+             units="messages"
+             symbol_name="GtiHiDepthMemoryReads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Depth Cache"
+             />
+    <counter name="TCS Threads Dispatched"
+             description="The total number of control shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 10 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Control Shader"
+             />
+    <counter name="TCS AVG Stall per Thread"
+             description="The average number of cycles per hardware thread run in which control shaders were stalled on the EUs."
+             data_type="uint64"
+             equation="A 8 READ $HsThreads UDIV"
+             underscore_name="hs_eu_stall_per_thread"
+             units="cycles"
+             symbol_name="HsEuStallPerThread"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Control Shader"
+             />
+    <counter name="TCS EU Active"
+             description="The percentage of time in which control shaders were processed actively on the EUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="hs_eu_active"
+             units="percent"
+             symbol_name="HsEuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="EU Array/Control Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 36 READ"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="Late Depth Test Fails"
+             description="The total number of pixels dropped on post-FS depth test."
+             data_type="uint64"
+             equation="A 39 READ $SamplesKilledInPs USUB"
+             underscore_name="post_ps_depth_test_fails"
+             units="pixels"
+             symbol_name="PostPsDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="TCS AVG Active per Thread"
+             description="The average number of cycles per hardware thread run in which control shaders were processed actively on the EUs."
+             data_type="uint64"
+             max_equation="100"
+             equation="A 7 READ $HsThreads UDIV"
+             underscore_name="hs_eu_active_per_thread"
+             units="cycles"
+             symbol_name="HsEuActivePerThread"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="EU Array/Control Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="FS EU Stall"
+             description="The percentage of time in which fragment shaders were stalled on the EUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 28 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_stall"
+             units="percent"
+             symbol_name="PsEuStall"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="EU Array/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 1 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GtiMscMemoryReads"
+             description="The total number of GTI memory reads from Multisampling Color Cache (Multisampling Color Cache misses)."
+             data_type="uint64"
+             equation="B 4 READ"
+             underscore_name="gti_msc_memory_reads"
+             units="messages"
+             symbol_name="GtiMscMemoryReads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Color Cache"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 33 READ"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="VS EU Active"
+             description="The percentage of time in which vertex shaders were processed actively on the EUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 2 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_eu_active"
+             units="percent"
+             symbol_name="VsEuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="CS EU Active"
+             description="The percentage of time in which compute shaders were processed actively on the EUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="cs_eu_active"
+             units="percent"
+             symbol_name="CsEuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="EU Array/Compute Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="CS AVG Stall per Thread"
+             description="The average number of cycles per hardware thread run in which compute shaders were stalled on the EUs."
+             data_type="uint64"
+             equation="A 18 READ $CsThreads UDIV"
+             underscore_name="cs_eu_stall_per_thread"
+             units="cycles"
+             symbol_name="CsEuStallPerThread"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="LLC GPU Hits"
+             description="The total number of successful LLC cache lookups done from the GPU."
+             data_type="uint64"
+             equation="PERFCNT2 READ_REG"
+             underscore_name="llc_hits"
+             units="messages"
+             symbol_name="LlcHits"
+             availability="true $QueryMode &&"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="LLC"
+             />
+    <counter name="GtiVfMemoryReads"
+             description="The total number of GTI memory reads from Vertex Fetch."
+             data_type="uint64"
+             equation="B 1 READ"
+             underscore_name="gti_vf_memory_reads"
+             units="messages"
+             symbol_name="GtiVfMemoryReads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/3D Pipe/Vertex Fetch"
+             />
+    <counter name="Late Stencil Test Fails"
+             description="The total number of pixels dropped on post-FS stencil test."
+             data_type="uint64"
+             equation="A 38 READ"
+             underscore_name="post_ps_stencil_test_fails"
+             units="pixels"
+             symbol_name="PostPsStencilTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GtiStcMemoryReads"
+             description="The total number of GTI memory reads from Stencil Cache."
+             data_type="uint64"
+             equation="B 6 READ"
+             underscore_name="gti_stc_memory_reads"
+             units="messages"
+             symbol_name="GtiStcMemoryReads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Depth Cache"
+             />
+    <counter name="VS AVG Active per Thread"
+             description="The average number of cycles per hardware thread run in which vertex shaders were processed actively on the EUs."
+             data_type="uint64"
+             max_equation="100"
+             equation="A 2 READ $VsThreads UDIV"
+             underscore_name="vs_eu_active_per_thread"
+             units="cycles"
+             symbol_name="VsEuActivePerThread"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GtiRsMemoryReads"
+             description="The total number of GTI memory reads from Resource Streamer."
+             data_type="uint64"
+             equation="B 2 READ"
+             underscore_name="gti_rs_memory_reads"
+             units="messages"
+             symbol_name="GtiRsMemoryReads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/3D Pipe/Resource Streamer"
+             />
+    <counter name="CS EU Stall"
+             description="The percentage of time in which compute shaders were stalled on the EUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="cs_eu_stall"
+             units="percent"
+             symbol_name="CsEuStall"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="EU Array/Compute Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 40 READ"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GtiL3Reads"
+             description="The total number of GTI memory reads from L3 (L3 misses)."
+             data_type="uint64"
+             equation="C 4 READ"
+             underscore_name="gti_l3_reads"
+             units="messages"
+             symbol_name="GtiL3Reads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI"
+             />
+    <counter name="VS EU Stall"
+             description="The percentage of time in which vertex shaders were stalled on the EUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 3 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_eu_stall"
+             units="percent"
+             symbol_name="VsEuStall"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x000253A4" value="0x34300000" />
+        <register type="NOA" address="0x00025440" value="0x2D800000" />
+        <register type="NOA" address="0x00025444" value="0x00000008" />
+        <register type="NOA" address="0x00025128" value="0x0E600000" />
+        <register type="NOA" address="0x00025380" value="0x00000450" />
+        <register type="NOA" address="0x00025390" value="0x00052C43" />
+        <register type="NOA" address="0x00025384" value="0x00000000" />
+        <register type="NOA" address="0x00025400" value="0x00006144" />
+        <register type="NOA" address="0x00025408" value="0x0A418820" />
+        <register type="NOA" address="0x0002540C" value="0x000820E6" />
+        <register type="NOA" address="0x00025404" value="0xFF500000" />
+        <register type="NOA" address="0x00025100" value="0x000005D6" />
+        <register type="NOA" address="0x0002510C" value="0x0EF00000" />
+        <register type="NOA" address="0x00025104" value="0x00000000" />
+        <register type="NOA" address="0x00025420" value="0x02108421" />
+        <register type="NOA" address="0x00025424" value="0x00008421" />
+        <register type="NOA" address="0x0002541C" value="0x00000000" />
+        <register type="NOA" address="0x00025428" value="0x00000000" />
+        <register type="NOA" address="0x000091BC" value="0xE0400000" />
+        <register type="NOA" address="0x000091C4" value="0xE4500000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002724" value="0xF0800000" /> <!--OASTARTTRIG6 -->
+        <register type="OA" address="0x00002720" value="0x00000000" /> <!--OASTARTTRIG5 -->
+        <register type="OA" address="0x00002714" value="0xF0800000" /> <!--OASTARTTRIG2 -->
+        <register type="OA" address="0x00002710" value="0x00000000" /> <!--OASTARTTRIG1 -->
+        <register type="OA" address="0x0000274C" value="0x76543298" /> <!--OAREPORTTRIG4 -->
+        <register type="OA" address="0x00002748" value="0x98989898" /> <!--OAREPORTTRIG3 -->
+        <register type="OA" address="0x00002744" value="0x000000E4" /> <!--OAREPORTTRIG2 -->
+        <register type="OA" address="0x00002740" value="0x00000000" /> <!--OAREPORTTRIG1 -->
+        <register type="OA" address="0x0000275C" value="0x98A98A98" /> <!--OAREPORTTRIG8 -->
+        <register type="OA" address="0x00002758" value="0x88888888" /> <!--OAREPORTTRIG7 -->
+        <register type="OA" address="0x00002754" value="0x000C5500" /> <!--OAREPORTTRIG6 -->
+        <register type="OA" address="0x00002750" value="0x00000000" /> <!--OAREPORTTRIG5 -->
+        <register type="OA" address="0x00002770" value="0x0007F81A" /> <!--OACEC0_0 -->
+        <register type="OA" address="0x00002774" value="0x0000FC00" /> <!--OACEC0_1 -->
+        <register type="OA" address="0x00002778" value="0x0007F82A" /> <!--OACEC1_0 -->
+        <register type="OA" address="0x0000277C" value="0x0000FC00" /> <!--OACEC1_1 -->
+        <register type="OA" address="0x00002780" value="0x0007F872" /> <!--OACEC2_0 -->
+        <register type="OA" address="0x00002784" value="0x0000FC00" /> <!--OACEC2_1 -->
+        <register type="OA" address="0x00002788" value="0x0007F8BA" /> <!--OACEC3_0 -->
+        <register type="OA" address="0x0000278C" value="0x0000FC00" /> <!--OACEC3_1 -->
+        <register type="OA" address="0x00002790" value="0x0007F87A" /> <!--OACEC4_0 -->
+        <register type="OA" address="0x00002794" value="0x0000FC00" /> <!--OACEC4_1 -->
+        <register type="OA" address="0x00002798" value="0x0007F8EA" /> <!--OACEC5_0 -->
+        <register type="OA" address="0x0000279C" value="0x0000FC00" /> <!--OACEC5_1 -->
+        <register type="OA" address="0x000027A0" value="0x0007F8E2" /> <!--OACEC6_0 -->
+        <register type="OA" address="0x000027A4" value="0x0000FC00" /> <!--OACEC6_1 -->
+        <register type="OA" address="0x000027A8" value="0x0007F8F2" /> <!--OACEC7_0 -->
+        <register type="OA" address="0x000027AC" value="0x0000FC00" /> <!--OACEC7_1 -->
+    </register_config>
+  </set>
+
+  <set name="Memory Writes Distribution Gen7.5"
+       mdapi_supported_apis="OGL OCL IO BB"
+       underscore_name="memory_writes"
+       hw_config_guid="f3c1ff4b-d0da-4ffa-8780-2c6b98f3f2d5"
+       chipset="HSW"
+       symbol_name="MemoryWrites"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="C 7 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="TES EU Stall"
+             description="The percentage of time in which evaluation shaders were stalled on the EUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 13 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ds_eu_stall"
+             units="percent"
+             symbol_name="DsEuStall"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="EU Array/Evaluation Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="LLC GPU Accesses"
+             description="The total number of LLC cache lookups done from the GPU (64B reads, 32B writes)."
+             data_type="uint64"
+             equation="PERFCNT1 READ_REG"
+             underscore_name="llc_accesses"
+             units="messages"
+             symbol_name="LlcAccesses"
+             availability="true $QueryMode &&"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="LLC"
+             />
+    <counter name="Alpha Test Fails"
+             description="The total number of pixels dropped on post-FS alpha test."
+             data_type="uint64"
+             equation="A 37 READ"
+             underscore_name="alpha_test_fails"
+             units="pixels"
+             symbol_name="AlphaTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="TES Threads Dispatched"
+             description="The total number of evaluation shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 15 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Evaluation Shader"
+             />
+    <counter name="TES AVG Active per Thread"
+             description="The average number of cycles per hardware thread run in which evaluation shaders were processed actively on the EUs."
+             data_type="uint64"
+             max_equation="100"
+             equation="A 12 READ $DsThreads UDIV"
+             underscore_name="ds_eu_active_per_thread"
+             units="cycles"
+             symbol_name="DsEuActivePerThread"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="EU Array/Evaluation Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 25 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="GS EU Stall"
+             description="The percentage of time in which geometry shaders were stalled on the EUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 23 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gs_eu_stall"
+             units="percent"
+             symbol_name="GsEuStall"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="EU Array/Geometry Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 30 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="GtiMscMemoryWrites"
+             description="The total number of GTI memory writes from Multisampling Color Cache (Multisampling Color Cache invalidations)."
+             data_type="uint64"
+             equation="B 4 READ"
+             underscore_name="gti_msc_memory_writes"
+             units="messages"
+             symbol_name="GtiMscMemoryWrites"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Color Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 20 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="CS AVG Active per Thread"
+             description="The average number of cycles per hardware thread run in which compute shaders were processed actively on the EUs."
+             data_type="uint64"
+             max_equation="100"
+             equation="A 17 READ $CsThreads UDIV"
+             underscore_name="cs_eu_active_per_thread"
+             units="cycles"
+             symbol_name="CsEuActivePerThread"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="EU Array/Compute Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GtiCmdStreamerMemoryWrites"
+             description="The total number of GTI memory writes from Command Streamer."
+             data_type="uint64"
+             equation="B 0 READ"
+             underscore_name="gti_cmd_streamer_memory_writes"
+             units="messages"
+             symbol_name="GtiCmdStreamerMemoryWrites"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/3D Pipe/Command Streamer"
+             />
+    <counter name="GS AVG Stall per Thread"
+             description="The average number of cycles per hardware thread run in which geometry shaders were stalled on the EUs."
+             data_type="uint64"
+             equation="A 23 READ $GsThreads UDIV"
+             underscore_name="gs_eu_stall_per_thread"
+             units="cycles"
+             symbol_name="GsEuStallPerThread"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="GtiL3Writes"
+             description="The total number of GTI memory writes from L3 (L3 invalidations)."
+             data_type="uint64"
+             equation="C 4 READ"
+             underscore_name="gti_l3_writes"
+             units="messages"
+             symbol_name="GtiL3Writes"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/L3"
+             />
+    <counter name="GtiHizMemoryWrites"
+             description="The total number of GTI memory writes from Hierarchical Depth Cache."
+             data_type="uint64"
+             equation="B 5 READ"
+             underscore_name="gti_hiz_memory_writes"
+             units="messages"
+             symbol_name="GtiHizMemoryWrites"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Depth Cache"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="FS AVG Stall per Thread"
+             description="The average number of cycles per hardware thread run in which fragment shaders were stalled on the EUs."
+             data_type="uint64"
+             equation="A 28 READ $PsThreads UDIV"
+             underscore_name="ps_eu_stall_per_thread"
+             units="cycles"
+             symbol_name="PsEuStallPerThread"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="GtiRccMemoryWrites"
+             description="The total number of GTI memory writes from Render Color Cache (Render Color Cache invalidations)."
+             data_type="uint64"
+             equation="B 3 READ"
+             underscore_name="gti_rcc_memory_writes"
+             units="messages"
+             symbol_name="GtiRccMemoryWrites"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Color Cache"
+             />
+    <counter name="TES EU Active"
+             description="The percentage of time in which evaluation shaders were processed actively on the EUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ds_eu_active"
+             units="percent"
+             symbol_name="DsEuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="EU Array/Evaluation Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS AVG Stall per Thread"
+             description="The average number of cycles per hardware thread run in which vertex shaders were stalled on the EUs."
+             data_type="uint64"
+             equation="A 3 READ $VsThreads UDIV"
+             underscore_name="vs_eu_stall_per_thread"
+             units="cycles"
+             symbol_name="VsEuStallPerThread"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="TCS EU Stall"
+             description="The percentage of time in which control shaders were stalled on the EUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="hs_eu_stall"
+             units="percent"
+             symbol_name="HsEuStall"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="EU Array/Control Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 41 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="FS AVG Active per Thread"
+             description="The average number of cycles per hardware thread run in which fragment shaders were processed actively on the EUs."
+             data_type="uint64"
+             max_equation="100"
+             equation="A 27 READ $PsThreads UDIV"
+             underscore_name="ps_eu_active_per_thread"
+             units="cycles"
+             symbol_name="PsEuActivePerThread"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="EU Array/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="LLC GPU Write Accesses"
+             description="The total number of LLC cache lookups for write done from the GPU (32B writes)."
+             data_type="uint64"
+             equation="C 6 READ 2 UMUL"
+             underscore_name="llc_wr_accesses"
+             units="messages"
+             symbol_name="LlcWrAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="LLC"
+             />
+    <counter name="GS EU Active"
+             description="The percentage of time in which geometry shaders were processed actively on the EUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 22 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gs_eu_active"
+             units="percent"
+             symbol_name="GsEuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="EU Array/Geometry Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="FS EU Active"
+             description="The percentage of time in which fragment shaders were processed actively on the EUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 27 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_active"
+             units="percent"
+             symbol_name="PsEuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="EU Array/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GtiStcMemoryWrites"
+             description="The total number of GTI memory writes from Stencil Cache."
+             data_type="uint64"
+             equation="B 6 READ"
+             underscore_name="gti_stc_memory_writes"
+             units="messages"
+             symbol_name="GtiStcMemoryWrites"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Depth Cache"
+             />
+    <counter name="TES AVG Stall per Thread"
+             description="The average number of cycles per hardware thread run in which evaluation shaders were stalled on the EUs."
+             data_type="uint64"
+             equation="A 13 READ $DsThreads UDIV"
+             underscore_name="ds_eu_stall_per_thread"
+             units="cycles"
+             symbol_name="DsEuStallPerThread"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Evaluation Shader"
+             />
+    <counter name="GS AVG Active per Thread"
+             description="The average number of cycles per hardware thread run in which geometry shaders were processed actively on the EUs."
+             data_type="uint64"
+             max_equation="100"
+             equation="A 22 READ $GsThreads UDIV"
+             underscore_name="gs_eu_active_per_thread"
+             units="cycles"
+             symbol_name="GsEuActivePerThread"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="EU Array/Geometry Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="TCS Threads Dispatched"
+             description="The total number of control shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 10 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Control Shader"
+             />
+    <counter name="TCS AVG Stall per Thread"
+             description="The average number of cycles per hardware thread run in which control shaders were stalled on the EUs."
+             data_type="uint64"
+             equation="A 8 READ $HsThreads UDIV"
+             underscore_name="hs_eu_stall_per_thread"
+             units="cycles"
+             symbol_name="HsEuStallPerThread"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Control Shader"
+             />
+    <counter name="TCS EU Active"
+             description="The percentage of time in which control shaders were processed actively on the EUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="hs_eu_active"
+             units="percent"
+             symbol_name="HsEuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="EU Array/Control Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 36 READ"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="Late Depth Test Fails"
+             description="The total number of pixels dropped on post-FS depth test."
+             data_type="uint64"
+             equation="A 39 READ $SamplesKilledInPs USUB"
+             underscore_name="post_ps_depth_test_fails"
+             units="pixels"
+             symbol_name="PostPsDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="TCS AVG Active per Thread"
+             description="The average number of cycles per hardware thread run in which control shaders were processed actively on the EUs."
+             data_type="uint64"
+             max_equation="100"
+             equation="A 7 READ $HsThreads UDIV"
+             underscore_name="hs_eu_active_per_thread"
+             units="cycles"
+             symbol_name="HsEuActivePerThread"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="EU Array/Control Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="FS EU Stall"
+             description="The percentage of time in which fragment shaders were stalled on the EUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 28 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_stall"
+             units="percent"
+             symbol_name="PsEuStall"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="EU Array/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 1 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 33 READ"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="VS EU Active"
+             description="The percentage of time in which vertex shaders were processed actively on the EUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 2 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_eu_active"
+             units="percent"
+             symbol_name="VsEuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="CS EU Active"
+             description="The percentage of time in which compute shaders were processed actively on the EUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="cs_eu_active"
+             units="percent"
+             symbol_name="CsEuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="EU Array/Compute Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="CS AVG Stall per Thread"
+             description="The average number of cycles per hardware thread run in which compute shaders were stalled on the EUs."
+             data_type="uint64"
+             equation="A 18 READ $CsThreads UDIV"
+             underscore_name="cs_eu_stall_per_thread"
+             units="cycles"
+             symbol_name="CsEuStallPerThread"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="LLC GPU Hits"
+             description="The total number of successful LLC cache lookups done from the GPU."
+             data_type="uint64"
+             equation="PERFCNT2 READ_REG"
+             underscore_name="llc_hits"
+             units="messages"
+             symbol_name="LlcHits"
+             availability="true $QueryMode &&"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="LLC"
+             />
+    <counter name="Late Stencil Test Fails"
+             description="The total number of pixels dropped on post-FS stencil test."
+             data_type="uint64"
+             equation="A 38 READ"
+             underscore_name="post_ps_stencil_test_fails"
+             units="pixels"
+             symbol_name="PostPsStencilTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="LLC GPU Throughput"
+             description="The total number of GPU memory bytes transferred between GPU and LLC."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL"
+             equation="PERFCNT1 READ_REG $LlcWrAccesses USUB 64 UMUL $LlcWrAccesses 32 UMUL UADD"
+             underscore_name="llc_gpu_throughput"
+             units="bytes"
+             symbol_name="LlcGpuThroughput"
+             availability="true $QueryMode &&"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="LLC"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GtiSoMemoryWrites"
+             description="The total number of GTI memory writes from Stream Output."
+             data_type="uint64"
+             equation="B 2 READ"
+             underscore_name="gti_so_memory_writes"
+             units="messages"
+             symbol_name="GtiSoMemoryWrites"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/3D Pipe/Stream Output"
+             />
+    <counter name="VS AVG Active per Thread"
+             description="The average number of cycles per hardware thread run in which vertex shaders were processed actively on the EUs."
+             data_type="uint64"
+             max_equation="100"
+             equation="A 2 READ $VsThreads UDIV"
+             underscore_name="vs_eu_active_per_thread"
+             units="cycles"
+             symbol_name="VsEuActivePerThread"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GtiRczMemoryWrites"
+             description="The total number of GTI memory writes from Render Depth Cache."
+             data_type="uint64"
+             equation="B 7 READ"
+             underscore_name="gti_rcz_memory_writes"
+             units="messages"
+             symbol_name="GtiRczMemoryWrites"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Depth Cache"
+             />
+    <counter name="CS EU Stall"
+             description="The percentage of time in which compute shaders were stalled on the EUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="cs_eu_stall"
+             units="percent"
+             symbol_name="CsEuStall"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="EU Array/Compute Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 40 READ"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GtiMemoryWrites"
+             description="The total number of GTI memory writes (64B each)."
+             data_type="uint64"
+             equation="C 5 READ"
+             underscore_name="gti_memory_writes"
+             units="messages"
+             symbol_name="GtiMemoryWrites"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI"
+             />
+    <counter name="VS EU Stall"
+             description="The percentage of time in which vertex shaders were stalled on the EUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 3 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_eu_stall"
+             units="percent"
+             symbol_name="VsEuStall"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x000253A4" value="0x34300000" />
+        <register type="NOA" address="0x00025440" value="0x01500000" />
+        <register type="NOA" address="0x00025444" value="0x00000120" />
+        <register type="NOA" address="0x00025128" value="0x0C200000" />
+        <register type="NOA" address="0x00025380" value="0x00000450" />
+        <register type="NOA" address="0x00025390" value="0x00052C43" />
+        <register type="NOA" address="0x00025384" value="0x00000000" />
+        <register type="NOA" address="0x00025400" value="0x00007184" />
+        <register type="NOA" address="0x00025408" value="0x0A418820" />
+        <register type="NOA" address="0x0002540C" value="0x000820E6" />
+        <register type="NOA" address="0x00025404" value="0xFF500000" />
+        <register type="NOA" address="0x00025100" value="0x000005D6" />
+        <register type="NOA" address="0x0002510C" value="0x1E700000" />
+        <register type="NOA" address="0x00025104" value="0x00000000" />
+        <register type="NOA" address="0x00025420" value="0x02108421" />
+        <register type="NOA" address="0x00025424" value="0x00008421" />
+        <register type="NOA" address="0x0002541C" value="0x00000000" />
+        <register type="NOA" address="0x00025428" value="0x00000000" />
+        <register type="NOA" address="0x000091BC" value="0xE0400000" />
+        <register type="NOA" address="0x000091C4" value="0xE4500000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002724" value="0xF0800000" /> <!--OASTARTTRIG6 -->
+        <register type="OA" address="0x00002720" value="0x00000000" /> <!--OASTARTTRIG5 -->
+        <register type="OA" address="0x00002714" value="0xF0800000" /> <!--OASTARTTRIG2 -->
+        <register type="OA" address="0x00002710" value="0x00000000" /> <!--OASTARTTRIG1 -->
+        <register type="OA" address="0x0000274C" value="0x76543298" /> <!--OAREPORTTRIG4 -->
+        <register type="OA" address="0x00002748" value="0x98989898" /> <!--OAREPORTTRIG3 -->
+        <register type="OA" address="0x00002744" value="0x000000E4" /> <!--OAREPORTTRIG2 -->
+        <register type="OA" address="0x00002740" value="0x00000000" /> <!--OAREPORTTRIG1 -->
+        <register type="OA" address="0x0000275C" value="0xBABABABA" /> <!--OAREPORTTRIG8 -->
+        <register type="OA" address="0x00002758" value="0x88888888" /> <!--OAREPORTTRIG7 -->
+        <register type="OA" address="0x00002754" value="0x000C5500" /> <!--OAREPORTTRIG6 -->
+        <register type="OA" address="0x00002750" value="0x00000000" /> <!--OAREPORTTRIG5 -->
+        <register type="OA" address="0x00002770" value="0x0007F81A" /> <!--OACEC0_0 -->
+        <register type="OA" address="0x00002774" value="0x0000FC00" /> <!--OACEC0_1 -->
+        <register type="OA" address="0x00002778" value="0x0007F82A" /> <!--OACEC1_0 -->
+        <register type="OA" address="0x0000277C" value="0x0000FC00" /> <!--OACEC1_1 -->
+        <register type="OA" address="0x00002780" value="0x0007F822" /> <!--OACEC2_0 -->
+        <register type="OA" address="0x00002784" value="0x0000FC00" /> <!--OACEC2_1 -->
+        <register type="OA" address="0x00002788" value="0x0007F8BA" /> <!--OACEC3_0 -->
+        <register type="OA" address="0x0000278C" value="0x0000FC00" /> <!--OACEC3_1 -->
+        <register type="OA" address="0x00002790" value="0x0007F87A" /> <!--OACEC4_0 -->
+        <register type="OA" address="0x00002794" value="0x0000FC00" /> <!--OACEC4_1 -->
+        <register type="OA" address="0x00002798" value="0x0007F8EA" /> <!--OACEC5_0 -->
+        <register type="OA" address="0x0000279C" value="0x0000FC00" /> <!--OACEC5_1 -->
+        <register type="OA" address="0x000027A0" value="0x0007F8E2" /> <!--OACEC6_0 -->
+        <register type="OA" address="0x000027A4" value="0x0000FC00" /> <!--OACEC6_1 -->
+        <register type="OA" address="0x000027A8" value="0x0007F8F2" /> <!--OACEC7_0 -->
+        <register type="OA" address="0x000027AC" value="0x0000FC00" /> <!--OACEC7_1 -->
+    </register_config>
+  </set>
+
+  <set name="Metric set SamplerBalance"
+       mdapi_supported_apis="OGL OCL IO BB"
+       underscore_name="sampler_balance"
+       hw_config_guid="e111cda4-19c3-41ee-b326-f99ac44ebf78"
+       chipset="HSW"
+       symbol_name="SamplerBalance"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="B 7 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="TES EU Stall"
+             description="The percentage of time in which evaluation shaders were stalled on the EUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 13 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ds_eu_stall"
+             units="percent"
+             symbol_name="DsEuStall"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="EU Array/Evaluation Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="LLC GPU Accesses"
+             description="The total number of LLC cache lookups done from the GPU (64B reads, 32B writes)."
+             data_type="uint64"
+             equation="PERFCNT1 READ_REG"
+             underscore_name="llc_accesses"
+             units="messages"
+             symbol_name="LlcAccesses"
+             availability="true $QueryMode &&"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="LLC"
+             />
+    <counter name="Sampler L2 cache misses (ss3)"
+             description="Number of sampler L2 cache misses (ss3)"
+             data_type="uint64"
+             equation="C 1 READ C 0 READ UADD"
+             underscore_name="sampler3_l2_cache_misses"
+             units="messages"
+             symbol_name="Sampler3L2CacheMisses"
+             availability="$SubsliceMask 0x8 AND"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="Alpha Test Fails"
+             description="The total number of pixels dropped on post-FS alpha test."
+             data_type="uint64"
+             equation="A 37 READ"
+             underscore_name="alpha_test_fails"
+             units="pixels"
+             symbol_name="AlphaTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="TES Threads Dispatched"
+             description="The total number of evaluation shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 15 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Evaluation Shader"
+             />
+    <counter name="TES AVG Active per Thread"
+             description="The average number of cycles per hardware thread run in which evaluation shaders were processed actively on the EUs."
+             data_type="uint64"
+             max_equation="100"
+             equation="A 12 READ $DsThreads UDIV"
+             underscore_name="ds_eu_active_per_thread"
+             units="cycles"
+             symbol_name="DsEuActivePerThread"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="EU Array/Evaluation Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 25 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="GS EU Stall"
+             description="The percentage of time in which geometry shaders were stalled on the EUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 23 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gs_eu_stall"
+             units="percent"
+             symbol_name="GsEuStall"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="EU Array/Geometry Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="CS EU Active"
+             description="The percentage of time in which compute shaders were processed actively on the EUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="cs_eu_active"
+             units="percent"
+             symbol_name="CsEuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="EU Array/Compute Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS EU Active"
+             description="The percentage of time in which vertex shaders were processed actively on the EUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 2 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_eu_active"
+             units="percent"
+             symbol_name="VsEuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="TCS EU Active"
+             description="The percentage of time in which control shaders were processed actively on the EUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="hs_eu_active"
+             units="percent"
+             symbol_name="HsEuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="EU Array/Control Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="TES EU Active"
+             description="The percentage of time in which evaluation shaders were processed actively on the EUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ds_eu_active"
+             units="percent"
+             symbol_name="DsEuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="EU Array/Evaluation Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS EU Active"
+             description="The percentage of time in which geometry shaders were processed actively on the EUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 22 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gs_eu_active"
+             units="percent"
+             symbol_name="GsEuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="EU Array/Geometry Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="FS EU Active"
+             description="The percentage of time in which fragment shaders were processed actively on the EUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 27 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_active"
+             units="percent"
+             symbol_name="PsEuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="EU Array/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="CS EU Stall"
+             description="The percentage of time in which compute shaders were stalled on the EUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="cs_eu_stall"
+             units="percent"
+             symbol_name="CsEuStall"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="EU Array/Compute Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 1 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS EU Stall"
+             description="The percentage of time in which vertex shaders were stalled on the EUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 3 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_eu_stall"
+             units="percent"
+             symbol_name="VsEuStall"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="TCS EU Stall"
+             description="The percentage of time in which control shaders were stalled on the EUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="hs_eu_stall"
+             units="percent"
+             symbol_name="HsEuStall"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="EU Array/Control Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="FS EU Stall"
+             description="The percentage of time in which fragment shaders were stalled on the EUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 28 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_stall"
+             units="percent"
+             symbol_name="PsEuStall"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="EU Array/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="CS Duration"
+             description="Total Compute Shader GPU duration."
+             data_type="uint64"
+             equation="A 17 READ  A 0 READ UMUL  A 2 READ  A 7 READ UADD  A 12 READ UADD  A 17 READ UADD  A 22 READ UADD  A 27 READ UADD UDIV  A 18 READ  A 1 READ UMUL  A 3 READ  A 8 READ UADD  A 13 READ UADD  A 18 READ UADD  A 23 READ UADD  A 28 READ UADD UDIV UADD $GpuTime UMUL $GpuCoreClocks $EuCoresTotalCount UMUL 1000 UMUL UDIV"
+             underscore_name="cs_duration"
+             units="us"
+             symbol_name="CsDuration"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4 OCL"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 30 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="TES Duration"
+             description="Total Evaluation Shader GPU duration."
+             data_type="uint64"
+             equation="A 12 READ  A 0 READ UMUL  A 2 READ  A 7 READ UADD  A 12 READ UADD  A 17 READ UADD  A 22 READ UADD  A 27 READ UADD UDIV  A 13 READ  A 1 READ UMUL  A 3 READ  A 8 READ UADD  A 13 READ UADD  A 18 READ UADD  A 23 READ UADD  A 28 READ UADD UDIV UADD $GpuTime UMUL $GpuCoreClocks $EuCoresTotalCount UMUL 1000 UMUL UDIV"
+             underscore_name="ds_duration"
+             units="us"
+             symbol_name="DsDuration"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Evaluation Shader"
+             />
+    <counter name="GS Duration"
+             description="Total Geometry Shader GPU duration."
+             data_type="uint64"
+             equation="A 22 READ  A 0 READ UMUL  A 2 READ  A 7 READ UADD  A 12 READ UADD  A 17 READ UADD  A 22 READ UADD  A 27 READ UADD UDIV  A 23 READ  A 1 READ UMUL  A 3 READ  A 8 READ UADD  A 13 READ UADD  A 18 READ UADD  A 23 READ UADD  A 28 READ UADD UDIV UADD $GpuTime UMUL $GpuCoreClocks $EuCoresTotalCount UMUL 1000 UMUL UDIV"
+             underscore_name="gs_duration"
+             units="us"
+             symbol_name="GsDuration"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 20 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="CS AVG Active per Thread"
+             description="The average number of cycles per hardware thread run in which compute shaders were processed actively on the EUs."
+             data_type="uint64"
+             max_equation="100"
+             equation="A 17 READ $CsThreads UDIV"
+             underscore_name="cs_eu_active_per_thread"
+             units="cycles"
+             symbol_name="CsEuActivePerThread"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="EU Array/Compute Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler L2 cache misses"
+             description="Number of sampler L2 cache misses"
+             data_type="uint64"
+             equation="C 7 READ C 6 READ UADD C 5 READ UADD C 4 READ UADD C 3 READ UADD C 2 READ UADD C 1 READ UADD C 0 READ UADD"
+             underscore_name="sampler_l2_cache_misses"
+             units="messages"
+             symbol_name="SamplerL2CacheMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler"
+             />
+    <counter name="GS AVG Stall per Thread"
+             description="The average number of cycles per hardware thread run in which geometry shaders were stalled on the EUs."
+             data_type="uint64"
+             equation="A 23 READ $GsThreads UDIV"
+             underscore_name="gs_eu_stall_per_thread"
+             units="cycles"
+             symbol_name="GsEuStallPerThread"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Sampler L2 cache misses (ss2)"
+             description="Number of sampler L2 cache misses (ss2)"
+             data_type="uint64"
+             equation="C 3 READ C 2 READ UADD"
+             underscore_name="sampler2_l2_cache_misses"
+             units="messages"
+             symbol_name="Sampler2L2CacheMisses"
+             availability="$SubsliceMask 0x4 AND"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Idle"
+             description="The percentage of time in which the Execution Units were idle."
+             data_type="float"
+             max_equation="100"
+             equation="100 $EuActive $EuStall FADD FSUB"
+             underscore_name="eu_idle"
+             units="percent"
+             symbol_name="EuIdle"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="FS AVG Stall per Thread"
+             description="The average number of cycles per hardware thread run in which fragment shaders were stalled on the EUs."
+             data_type="uint64"
+             equation="A 28 READ $PsThreads UDIV"
+             underscore_name="ps_eu_stall_per_thread"
+             units="cycles"
+             symbol_name="PsEuStallPerThread"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="VS AVG Stall per Thread"
+             description="The average number of cycles per hardware thread run in which vertex shaders were stalled on the EUs."
+             data_type="uint64"
+             equation="A 3 READ $VsThreads UDIV"
+             underscore_name="vs_eu_stall_per_thread"
+             units="cycles"
+             symbol_name="VsEuStallPerThread"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 41 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="FS AVG Active per Thread"
+             description="The average number of cycles per hardware thread run in which fragment shaders were processed actively on the EUs."
+             data_type="uint64"
+             max_equation="100"
+             equation="A 27 READ $PsThreads UDIV"
+             underscore_name="ps_eu_active_per_thread"
+             units="cycles"
+             symbol_name="PsEuActivePerThread"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="EU Array/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="TCS Duration"
+             description="Total Control Shader GPU duration."
+             data_type="uint64"
+             equation="A 7 READ  A 0 READ UMUL  A 2 READ  A 7 READ UADD  A 12 READ UADD  A 17 READ UADD  A 22 READ UADD  A 27 READ UADD UDIV  A 8 READ  A 1 READ UMUL  A 3 READ  A 8 READ UADD  A 13 READ UADD  A 18 READ UADD  A 23 READ UADD  A 28 READ UADD UDIV UADD $GpuTime UMUL $GpuCoreClocks $EuCoresTotalCount UMUL 1000 UMUL UDIV"
+             underscore_name="hs_duration"
+             units="us"
+             symbol_name="HsDuration"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4 OCL"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Control Shader"
+             />
+    <counter name="TES AVG Stall per Thread"
+             description="The average number of cycles per hardware thread run in which evaluation shaders were stalled on the EUs."
+             data_type="uint64"
+             equation="A 13 READ $DsThreads UDIV"
+             underscore_name="ds_eu_stall_per_thread"
+             units="cycles"
+             symbol_name="DsEuStallPerThread"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Evaluation Shader"
+             />
+    <counter name="GS AVG Active per Thread"
+             description="The average number of cycles per hardware thread run in which geometry shaders were processed actively on the EUs."
+             data_type="uint64"
+             max_equation="100"
+             equation="A 22 READ $GsThreads UDIV"
+             underscore_name="gs_eu_active_per_thread"
+             units="cycles"
+             symbol_name="GsEuActivePerThread"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="EU Array/Geometry Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="TCS Threads Dispatched"
+             description="The total number of control shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 10 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Control Shader"
+             />
+    <counter name="TCS AVG Stall per Thread"
+             description="The average number of cycles per hardware thread run in which control shaders were stalled on the EUs."
+             data_type="uint64"
+             equation="A 8 READ $HsThreads UDIV"
+             underscore_name="hs_eu_stall_per_thread"
+             units="cycles"
+             symbol_name="HsEuStallPerThread"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Control Shader"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 36 READ"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="Late Depth Test Fails"
+             description="The total number of pixels dropped on post-FS depth test."
+             data_type="uint64"
+             equation="A 39 READ $SamplesKilledInPs USUB"
+             underscore_name="post_ps_depth_test_fails"
+             units="pixels"
+             symbol_name="PostPsDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="TCS AVG Active per Thread"
+             description="The average number of cycles per hardware thread run in which control shaders were processed actively on the EUs."
+             data_type="uint64"
+             max_equation="100"
+             equation="A 7 READ $HsThreads UDIV"
+             underscore_name="hs_eu_active_per_thread"
+             units="cycles"
+             symbol_name="HsEuActivePerThread"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="EU Array/Control Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="FS Duration"
+             description="Total Fragment Shader GPU duration."
+             data_type="uint64"
+             equation="A 27 READ  A 0 READ UMUL  A 2 READ  A 7 READ UADD  A 12 READ UADD  A 17 READ UADD  A 22 READ UADD  A 27 READ UADD UDIV  A 28 READ  A 1 READ UMUL  A 3 READ  A 8 READ UADD  A 13 READ UADD  A 18 READ UADD  A 23 READ UADD  A 28 READ UADD UDIV UADD $GpuTime UMUL $GpuCoreClocks $EuCoresTotalCount UMUL 1000 UMUL UDIV"
+             underscore_name="ps_duration"
+             units="us"
+             symbol_name="PsDuration"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Sampler L2 cache misses (ss1)"
+             description="Number of sampler L2 cache misses (ss1)"
+             data_type="uint64"
+             equation="C 5 READ C 4 READ UADD"
+             underscore_name="sampler1_l2_cache_misses"
+             units="messages"
+             symbol_name="Sampler1L2CacheMisses"
+             availability="$SubsliceMask 0x2 AND"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 33 READ"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="CS AVG Stall per Thread"
+             description="The average number of cycles per hardware thread run in which compute shaders were stalled on the EUs."
+             data_type="uint64"
+             equation="A 18 READ $CsThreads UDIV"
+             underscore_name="cs_eu_stall_per_thread"
+             units="cycles"
+             symbol_name="CsEuStallPerThread"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="LLC GPU Hits"
+             description="The total number of successful LLC cache lookups done from the GPU."
+             data_type="uint64"
+             equation="PERFCNT2 READ_REG"
+             underscore_name="llc_hits"
+             units="messages"
+             symbol_name="LlcHits"
+             availability="true $QueryMode &&"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="LLC"
+             />
+    <counter name="Late Stencil Test Fails"
+             description="The total number of pixels dropped on post-FS stencil test."
+             data_type="uint64"
+             equation="A 38 READ"
+             underscore_name="post_ps_stencil_test_fails"
+             units="pixels"
+             symbol_name="PostPsStencilTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Sampler L2 cache misses (ss0)"
+             description="Number of sampler L2 cache misses (ss0)"
+             data_type="uint64"
+             equation="C 7 READ C 6 READ UADD"
+             underscore_name="sampler0_l2_cache_misses"
+             units="messages"
+             symbol_name="Sampler0L2CacheMisses"
+             availability="$SubsliceMask 0x1 AND"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="VS AVG Active per Thread"
+             description="The average number of cycles per hardware thread run in which vertex shaders were processed actively on the EUs."
+             data_type="uint64"
+             max_equation="100"
+             equation="A 2 READ $VsThreads UDIV"
+             underscore_name="vs_eu_active_per_thread"
+             units="cycles"
+             symbol_name="VsEuActivePerThread"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Duration"
+             description="Total Vertex Shader GPU duration."
+             data_type="uint64"
+             equation="A 2 READ  A 0 READ UMUL  A 2 READ  A 7 READ UADD  A 12 READ UADD  A 17 READ UADD  A 22 READ UADD  A 27 READ UADD UDIV  A 3 READ  A 1 READ UMUL  A 3 READ  A 8 READ UADD  A 13 READ UADD  A 18 READ UADD  A 23 READ UADD  A 28 READ UADD UDIV UADD $GpuTime UMUL $GpuCoreClocks $EuCoresTotalCount UMUL 1000 UMUL UDIV"
+             underscore_name="vs_duration"
+             units="us"
+             symbol_name="VsDuration"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 40 READ"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x0002EB9C" value="0x01906400" />
+        <register type="NOA" address="0x0002FB9C" value="0x01906400" />
+        <register type="NOA" address="0x000253A4" value="0x00000000" />
+        <register type="NOA" address="0x00026B9C" value="0x01906400" />
+        <register type="NOA" address="0x00027B9C" value="0x01906400" />
+        <register type="NOA" address="0x00027104" value="0x00A00000" />
+        <register type="NOA" address="0x00027184" value="0x00A50000" />
+        <register type="NOA" address="0x0002E804" value="0x00500000" />
+        <register type="NOA" address="0x0002E984" value="0x00500000" />
+        <register type="NOA" address="0x0002EB04" value="0x00500000" />
+        <register type="NOA" address="0x0002EB80" value="0x00000084" />
+        <register type="NOA" address="0x0002EB8C" value="0x14200000" />
+        <register type="NOA" address="0x0002EB84" value="0x00000000" />
+        <register type="NOA" address="0x0002F804" value="0x00050000" />
+        <register type="NOA" address="0x0002F984" value="0x00050000" />
+        <register type="NOA" address="0x0002FB04" value="0x00050000" />
+        <register type="NOA" address="0x0002FB80" value="0x00000084" />
+        <register type="NOA" address="0x0002FB8C" value="0x00050800" />
+        <register type="NOA" address="0x0002FB84" value="0x00000000" />
+        <register type="NOA" address="0x00025380" value="0x00000010" />
+        <register type="NOA" address="0x0002538C" value="0x000000C0" />
+        <register type="NOA" address="0x00025384" value="0xAA550000" />
+        <register type="NOA" address="0x00025404" value="0xFFFFC000" />
+        <register type="NOA" address="0x00026804" value="0x50000000" />
+        <register type="NOA" address="0x00026984" value="0x50000000" />
+        <register type="NOA" address="0x00026B04" value="0x50000000" />
+        <register type="NOA" address="0x00026B80" value="0x00000084" />
+        <register type="NOA" address="0x00026B90" value="0x00050800" />
+        <register type="NOA" address="0x00026B84" value="0x00000000" />
+        <register type="NOA" address="0x00027804" value="0x05000000" />
+        <register type="NOA" address="0x00027984" value="0x05000000" />
+        <register type="NOA" address="0x00027B04" value="0x05000000" />
+        <register type="NOA" address="0x00027B80" value="0x00000084" />
+        <register type="NOA" address="0x00027B90" value="0x00000142" />
+        <register type="NOA" address="0x00027B84" value="0x00000000" />
+        <register type="NOA" address="0x00026104" value="0xA0000000" />
+        <register type="NOA" address="0x00026184" value="0xA5000000" />
+        <register type="NOA" address="0x00025424" value="0x00008620" />
+        <register type="NOA" address="0x0002541C" value="0x00000000" />
+        <register type="NOA" address="0x00025428" value="0x0004A54A" />
+        <register type="NOA" address="0x000091BC" value="0xE0400000" />
+        <register type="NOA" address="0x000091C4" value="0xE4500000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" /> <!--OAREPORTTRIG1 -->
+        <register type="OA" address="0x00002744" value="0x00800000" /> <!--OAREPORTTRIG2 -->
+        <register type="OA" address="0x00002710" value="0x00000000" /> <!--OASTARTTRIG1 -->
+        <register type="OA" address="0x00002714" value="0x00800000" /> <!--OASTARTTRIG2 -->
+        <register type="OA" address="0x00002720" value="0x00000000" /> <!--OASTARTTRIG5 -->
+        <register type="OA" address="0x00002724" value="0x00800000" /> <!--OASTARTTRIG6 -->
+    </register_config>
+  </set>
+
+</metrics>
diff --git a/lib/i915/perf-configs/oa-icl.xml b/lib/i915/perf-configs/oa-icl.xml
new file mode 100644
index 00000000..0b519415
--- /dev/null
+++ b/lib/i915/perf-configs/oa-icl.xml
@@ -0,0 +1,11869 @@
+<?xml version="1.0"?>
+<metrics version="1581935520" merge_md5="">
+  <set name="Render Metrics Basic Gen11"
+       mdapi_supported_apis="VK OGL OCL IO BB"
+       underscore_name="render_basic"
+       hw_config_guid="193093b2-da24-49bf-b407-442c213b71b4"
+       chipset="ICL"
+       symbol_name="RenderBasic"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Cache Misses"
+             description="The total number of sampler cache misses in all LODs in all sampler units."
+             data_type="uint64"
+             equation="C 4 READ C 5 READ UADD 2 UMUL"
+             underscore_name="sampler_l1_misses"
+             units="messages"
+             symbol_name="SamplerL1Misses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Sampler00 Busy"
+             description="The percentage of time in which Slice0 Sampler0 has been processing EU requests."
+             data_type="float"
+             max_equation="100"
+             equation="C 1 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler00_busy"
+             units="percent"
+             symbol_name="Sampler00Busy"
+             availability="$SubsliceMask 1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_group="Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Samplers Busy"
+             description="The percentage of time in which samplers have been processing EU requests."
+             data_type="float"
+             max_equation="100"
+             equation="$Sampler00Busy"
+             underscore_name="samplers_busy"
+             units="percent"
+             symbol_name="SamplersBusy"
+             availability="$SubsliceMask 9 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="Sampler"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texel lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="Sampler00 Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which Slice0 Sampler0 has been slowing down the pipe when processing EU requests."
+             data_type="float"
+             high_watermark="15"
+             equation="C 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             max_equation="100"
+             underscore_name="sampler00_bottleneck"
+             units="percent"
+             symbol_name="Sampler00Bottleneck"
+             availability="$SubsliceMask 1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GTI Read Throughput"
+             description="The total number of GPU memory bytes read from GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL"
+             equation="64  B 1 READ B 3 READ UADD B 4 READ UADD B 5 READ UADD UMUL"
+             underscore_name="gti_read_throughput"
+             units="bytes"
+             symbol_name="GtiReadThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 14 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 13 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Samplers Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which samplers have been slowing down the pipe when processing EU requests."
+             data_type="float"
+             high_watermark="15"
+             equation="$Sampler00Bottleneck"
+             max_equation="100"
+             underscore_name="sampler_bottleneck"
+             units="percent"
+             symbol_name="SamplerBottleneck"
+             availability="$SubsliceMask 9 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Indicate System Frame Batch Draw"
+             mdapi_group="Sampler"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="GTI Write Throughput"
+             description="The total number of GPU memory bytes written to GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL"
+             equation="64  B 0 READ B 2 READ UADD UMUL"
+             underscore_name="gti_write_throughput"
+             units="bytes"
+             symbol_name="GtiWriteThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches without URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="$ShaderMemoryAccesses 64 UMUL"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00000D04" value="0x00000200" />
+        <register type="NOA" address="0x00009840" value="0x00000000" />
+        <register type="NOA" address="0x00009884" value="0x00000000" />
+        <register type="NOA" address="0x00009888" value="0x142C0014" />
+        <register type="NOA" address="0x00009888" value="0x14120700" />
+        <register type="NOA" address="0x00009888" value="0x121500E0" />
+        <register type="NOA" address="0x00009888" value="0x1C1E000C" />
+        <register type="NOA" address="0x00009888" value="0x0E1F000C" />
+        <register type="NOA" address="0x00009888" value="0x1C200014" />
+        <register type="NOA" address="0x00009888" value="0x16212800" />
+        <register type="NOA" address="0x00009888" value="0x0E2C2041" />
+        <register type="NOA" address="0x00009888" value="0x102C0000" />
+        <register type="NOA" address="0x00009888" value="0x1A2C0000" />
+        <register type="NOA" address="0x00009888" value="0x10040140" />
+        <register type="NOA" address="0x00009888" value="0x0E040005" />
+        <register type="NOA" address="0x00009888" value="0x14050050" />
+        <register type="NOA" address="0x00009888" value="0x06054000" />
+        <register type="NOA" address="0x00009888" value="0x08051000" />
+        <register type="NOA" address="0x00009888" value="0x260600C0" />
+        <register type="NOA" address="0x00009888" value="0x24061800" />
+        <register type="NOA" address="0x00009888" value="0x04120023" />
+        <register type="NOA" address="0x00009888" value="0x10120000" />
+        <register type="NOA" address="0x00009888" value="0x08120000" />
+        <register type="NOA" address="0x00009888" value="0x06131000" />
+        <register type="NOA" address="0x00009888" value="0x04144000" />
+        <register type="NOA" address="0x00009888" value="0x02150980" />
+        <register type="NOA" address="0x00009888" value="0x10150000" />
+        <register type="NOA" address="0x00009888" value="0x1815000F" />
+        <register type="NOA" address="0x00009888" value="0x06150000" />
+        <register type="NOA" address="0x00009888" value="0x08154000" />
+        <register type="NOA" address="0x00009888" value="0x0E18A000" />
+        <register type="NOA" address="0x00009888" value="0x14190028" />
+        <register type="NOA" address="0x00009884" value="0x00000003" />
+        <register type="NOA" address="0x00009888" value="0x1A1C01C0" />
+        <register type="NOA" address="0x00009888" value="0x1C1C000A" />
+        <register type="NOA" address="0x00009888" value="0x1A5C01C0" />
+        <register type="NOA" address="0x00009888" value="0x1C5C000A" />
+        <register type="NOA" address="0x00009888" value="0x001C0097" />
+        <register type="NOA" address="0x00009888" value="0x061C9400" />
+        <register type="NOA" address="0x00009888" value="0x0A1C00A7" />
+        <register type="NOA" address="0x00009888" value="0x101C0000" />
+        <register type="NOA" address="0x00009888" value="0x081D8100" />
+        <register type="NOA" address="0x00009888" value="0x0A1D0004" />
+        <register type="NOA" address="0x00009888" value="0x085C9497" />
+        <register type="NOA" address="0x00009888" value="0x0A5CA700" />
+        <register type="NOA" address="0x00009888" value="0x105C0000" />
+        <register type="NOA" address="0x00009888" value="0x0A5D000B" />
+        <register type="NOA" address="0x00009888" value="0x181E8000" />
+        <register type="NOA" address="0x00009888" value="0x1E1EEF80" />
+        <register type="NOA" address="0x00009888" value="0x301F4000" />
+        <register type="NOA" address="0x00009888" value="0x501F2404" />
+        <register type="NOA" address="0x00009888" value="0x521F0092" />
+        <register type="NOA" address="0x00009888" value="0x541F0024" />
+        <register type="NOA" address="0x00009888" value="0x4E1F2000" />
+        <register type="NOA" address="0x00009888" value="0x3E1F0300" />
+        <register type="NOA" address="0x00009888" value="0x461F0303" />
+        <register type="NOA" address="0x00009888" value="0x481F0303" />
+        <register type="NOA" address="0x00009888" value="0x4A1F0003" />
+        <register type="NOA" address="0x00009888" value="0x181F0000" />
+        <register type="NOA" address="0x00009888" value="0x4C1F0000" />
+        <register type="NOA" address="0x00009888" value="0x421F4001" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x00800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E65C" value="0xFFFFFFFF" />
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E758" value="0x00051050" />
+        <register type="FLEX" address="0x0000E45C" value="0x00000052" />
+    </register_config>
+  </set>
+
+  <set name="Compute Metrics Basic Gen11"
+       mdapi_supported_apis="VK OGL OCL IO BB"
+       underscore_name="compute_basic"
+       hw_config_guid="12ca7e9c-55cb-45cd-9f87-4fc821488e6d"
+       chipset="ICL"
+       symbol_name="ComputeBasic"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Untyped Bytes Read"
+             description="The total number of untyped memory bytes read via Data Port."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="C 3 READ C 2 READ UADD $EuSubslicesTotalCount UMUL 32 UMUL"
+             underscore_name="untyped_bytes_read"
+             units="bytes"
+             symbol_name="UntypedBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Typed Bytes Written"
+             description="The total number of typed memory bytes written via Data Port."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="C 5 READ C 4 READ UADD $EuSubslicesTotalCount UMUL 32 UMUL"
+             underscore_name="typed_bytes_written"
+             units="bytes"
+             symbol_name="TypedBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU AVG IPC Rate"
+             description="The average rate of IPC calculated for 2 FPU pipelines."
+             data_type="float"
+             max_equation="2"
+             equation="A 9 READ A 10 READ A 11 READ FADD A 9 READ FSUB FDIV 1 FADD"
+             underscore_name="eu_avg_ipc_rate"
+             units="number"
+             symbol_name="EuAvgIpcRate"
+             semantic_type="ratio"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="EU FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="fpu1_active"
+             units="percent"
+             symbol_name="Fpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="fpu0_active"
+             units="percent"
+             symbol_name="Fpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Typed Atomics Accesses"
+             description="The total number of typed atomic accesses via Data Port."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="B 4 READ B 5 READ FADD 2 FDIV $EuSubslicesTotalCount FMUL"
+             underscore_name="typed_atomics"
+             units="events"
+             symbol_name="TypedAtomics"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texel lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GTI Read Throughput"
+             description="The total number of GPU memory bytes read from GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL"
+             equation="64  B 1 READ B 3 READ UADD B 6 READ UADD B 7 READ UADD UMUL"
+             underscore_name="gti_read_throughput"
+             units="bytes"
+             symbol_name="GtiReadThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Untyped Writes"
+             description="The total number of untyped memory bytes written via Data Port."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="C 1 READ C 0 READ UADD $EuSubslicesTotalCount UMUL 32 UMUL"
+             underscore_name="untyped_bytes_written"
+             units="bytes"
+             symbol_name="UntypedBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="Typed Bytes Read"
+             description="The total number of typed memory bytes read via Data Port."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="C 7 READ C 6 READ UADD $EuSubslicesTotalCount UMUL 32 UMUL"
+             underscore_name="typed_bytes_read"
+             units="bytes"
+             symbol_name="TypedBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="EU Thread Occupancy"
+             description="The percentage of time in which hardware threads occupied EUs."
+             data_type="float"
+             max_equation="100"
+             equation="8 A 13 READ FMUL $EuThreadsCount FDIV $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_thread_occupancy"
+             units="percent"
+             symbol_name="EuThreadOccupancy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="GTI Write Throughput"
+             description="The total number of GPU memory bytes written to GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL"
+             equation="64  B 0 READ B 2 READ UADD UMUL"
+             underscore_name="gti_write_throughput"
+             units="bytes"
+             symbol_name="GtiWriteThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="$ShaderMemoryAccesses 64 UMUL"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <counter name="EU Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_send_active"
+             units="percent"
+             symbol_name="EuSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00000D04" value="0x00000200" />
+        <register type="NOA" address="0x00009840" value="0x00000000" />
+        <register type="NOA" address="0x00009884" value="0x00000000" />
+        <register type="NOA" address="0x00009888" value="0x12230012" />
+        <register type="NOA" address="0x00009888" value="0x10230019" />
+        <register type="NOA" address="0x00009888" value="0x12A30012" />
+        <register type="NOA" address="0x00009888" value="0x10A30019" />
+        <register type="NOA" address="0x00009888" value="0x1A200400" />
+        <register type="NOA" address="0x00009888" value="0x1C200020" />
+        <register type="NOA" address="0x00009888" value="0x04208000" />
+        <register type="NOA" address="0x00009888" value="0x08208000" />
+        <register type="NOA" address="0x00009888" value="0x0C208000" />
+        <register type="NOA" address="0x00009888" value="0x0A230031" />
+        <register type="NOA" address="0x00009888" value="0x0E231E00" />
+        <register type="NOA" address="0x00009888" value="0x0223003D" />
+        <register type="NOA" address="0x00009888" value="0x04230032" />
+        <register type="NOA" address="0x00009888" value="0x06230033" />
+        <register type="NOA" address="0x00009888" value="0x00230000" />
+        <register type="NOA" address="0x00009888" value="0x1AA01000" />
+        <register type="NOA" address="0x00009888" value="0x1CA00008" />
+        <register type="NOA" address="0x00009888" value="0x02A08000" />
+        <register type="NOA" address="0x00009888" value="0x06A08000" />
+        <register type="NOA" address="0x00009888" value="0x0AA08000" />
+        <register type="NOA" address="0x00009888" value="0x0AA31880" />
+        <register type="NOA" address="0x00009888" value="0x0EA3003C" />
+        <register type="NOA" address="0x00009888" value="0x00A31E80" />
+        <register type="NOA" address="0x00009888" value="0x02A31900" />
+        <register type="NOA" address="0x00009888" value="0x04A31980" />
+        <register type="NOA" address="0x00009888" value="0x0E044055" />
+        <register type="NOA" address="0x00009888" value="0x10040141" />
+        <register type="NOA" address="0x00009888" value="0x0C045000" />
+        <register type="NOA" address="0x00009888" value="0x0E055000" />
+        <register type="NOA" address="0x00009888" value="0x14050050" />
+        <register type="NOA" address="0x00009888" value="0x04054000" />
+        <register type="NOA" address="0x00009888" value="0x06055000" />
+        <register type="NOA" address="0x00009888" value="0x08055000" />
+        <register type="NOA" address="0x00009888" value="0x0A051000" />
+        <register type="NOA" address="0x00009888" value="0x260600CC" />
+        <register type="NOA" address="0x00009888" value="0x24067E00" />
+        <register type="NOA" address="0x00009888" value="0x18123000" />
+        <register type="NOA" address="0x00009888" value="0x1A12000C" />
+        <register type="NOA" address="0x00009888" value="0x0212C000" />
+        <register type="NOA" address="0x00009888" value="0x0612C000" />
+        <register type="NOA" address="0x00009888" value="0x0A12C000" />
+        <register type="NOA" address="0x00009888" value="0x08138000" />
+        <register type="NOA" address="0x00009888" value="0x0A134000" />
+        <register type="NOA" address="0x00009888" value="0x0413A000" />
+        <register type="NOA" address="0x00009888" value="0x06132000" />
+        <register type="NOA" address="0x00009888" value="0x0A148000" />
+        <register type="NOA" address="0x00009888" value="0x0E144000" />
+        <register type="NOA" address="0x00009888" value="0x00148000" />
+        <register type="NOA" address="0x00009888" value="0x02148000" />
+        <register type="NOA" address="0x00009888" value="0x04148000" />
+        <register type="NOA" address="0x00009888" value="0x16150380" />
+        <register type="NOA" address="0x00009888" value="0x1815000D" />
+        <register type="NOA" address="0x00009888" value="0x02154000" />
+        <register type="NOA" address="0x00009888" value="0x0415C000" />
+        <register type="NOA" address="0x00009888" value="0x06154000" />
+        <register type="NOA" address="0x00009888" value="0x0815C000" />
+        <register type="NOA" address="0x00009888" value="0x0A154000" />
+        <register type="NOA" address="0x00009888" value="0x0C15C000" />
+        <register type="NOA" address="0x00009888" value="0x0A182000" />
+        <register type="NOA" address="0x00009888" value="0x0E188000" />
+        <register type="NOA" address="0x00009888" value="0x02182000" />
+        <register type="NOA" address="0x00009888" value="0x04182000" />
+        <register type="NOA" address="0x00009888" value="0x06182000" />
+        <register type="NOA" address="0x00009888" value="0x12190400" />
+        <register type="NOA" address="0x00009888" value="0x14190020" />
+        <register type="NOA" address="0x00009888" value="0x0A192000" />
+        <register type="NOA" address="0x00009888" value="0x0C192000" />
+        <register type="NOA" address="0x00009888" value="0x0E192000" />
+        <register type="NOA" address="0x00009888" value="0x0A1C8000" />
+        <register type="NOA" address="0x00009888" value="0x0E1C2000" />
+        <register type="NOA" address="0x00009888" value="0x001C8000" />
+        <register type="NOA" address="0x00009888" value="0x021C8000" />
+        <register type="NOA" address="0x00009888" value="0x041C8000" />
+        <register type="NOA" address="0x00009888" value="0x121D1000" />
+        <register type="NOA" address="0x00009888" value="0x141D0008" />
+        <register type="NOA" address="0x00009888" value="0x081D8000" />
+        <register type="NOA" address="0x00009888" value="0x0A1D8000" />
+        <register type="NOA" address="0x00009888" value="0x0C1D8000" />
+        <register type="NOA" address="0x00009884" value="0x00000003" />
+        <register type="NOA" address="0x00009888" value="0x1A1C01C0" />
+        <register type="NOA" address="0x00009888" value="0x1C1C000A" />
+        <register type="NOA" address="0x00009888" value="0x1A5C01C0" />
+        <register type="NOA" address="0x00009888" value="0x1C5C000A" />
+        <register type="NOA" address="0x00009888" value="0x001C0097" />
+        <register type="NOA" address="0x00009888" value="0x061C9400" />
+        <register type="NOA" address="0x00009888" value="0x0C1C00A7" />
+        <register type="NOA" address="0x00009888" value="0x101C0000" />
+        <register type="NOA" address="0x00009888" value="0x081D8100" />
+        <register type="NOA" address="0x00009888" value="0x0A1D0010" />
+        <register type="NOA" address="0x00009888" value="0x085C9497" />
+        <register type="NOA" address="0x00009888" value="0x0C5CA700" />
+        <register type="NOA" address="0x00009888" value="0x105C0000" />
+        <register type="NOA" address="0x00009888" value="0x0A5D0023" />
+        <register type="NOA" address="0x00009888" value="0x181E8000" />
+        <register type="NOA" address="0x00009888" value="0x1E1E0F80" />
+        <register type="NOA" address="0x00009888" value="0x201E000E" />
+        <register type="NOA" address="0x00009888" value="0x301F4000" />
+        <register type="NOA" address="0x00009888" value="0x501F2524" />
+        <register type="NOA" address="0x00009888" value="0x521F2522" />
+        <register type="NOA" address="0x00009888" value="0x541F0024" />
+        <register type="NOA" address="0x00009888" value="0x3A1F8000" />
+        <register type="NOA" address="0x00009888" value="0x4E1F2430" />
+        <register type="NOA" address="0x00009888" value="0x3E1F0300" />
+        <register type="NOA" address="0x00009888" value="0x461F0303" />
+        <register type="NOA" address="0x00009888" value="0x481F3003" />
+        <register type="NOA" address="0x00009888" value="0x4A1F0300" />
+        <register type="NOA" address="0x00009888" value="0x4C1F0003" />
+        <register type="NOA" address="0x00009888" value="0x181F0000" />
+        <register type="NOA" address="0x00009888" value="0x401F3000" />
+        <register type="NOA" address="0x00009888" value="0x421F3000" />
+        <register type="NOA" address="0x00009888" value="0x441F3000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x00800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E65C" value="0xFFFFFFFF" />
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00000003" />
+        <register type="FLEX" address="0x0000E658" value="0x00002001" />
+        <register type="FLEX" address="0x0000E758" value="0x00000008" />
+    </register_config>
+  </set>
+
+  <set name="ComputeExtended Gen11"
+       mdapi_supported_apis="VK OGL OGL4 OCL MEDIA IO BB"
+       underscore_name="compute_extended"
+       hw_config_guid="43eb7fc1-dc5e-45e2-a90a-0053f5397271"
+       chipset="ICL"
+       symbol_name="ComputeExtended"
+       >
+    <counter name="UntypedWritesPerCacheLine"
+             description="The ratio of EU untyped write requests to L3 cache line writes."
+             data_type="float"
+             equation="B 7 READ B 1 READ FADD C 2 READ FADD C 3 READ FDIV"
+             underscore_name="untyped_writes_per_cache_line"
+             units="eu sends to l3 cache lines"
+             symbol_name="UntypedWritesPerCacheLine"
+             availability="$SubsliceMask 1 AND"
+             semantic_type="ratio"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="Eu Typed Atomics 00"
+             description="Slice0 Dualsubslice 0 Eu Typed Atomics"
+             data_type="uint64"
+             equation="B 2 READ"
+             underscore_name="eu_typed_atomics00"
+             units="messages"
+             symbol_name="EuTypedAtomics00"
+             availability="$SubsliceMask 1 AND"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="Typed Atomics 00"
+             description="Slice 0 Dualsubslice 0 typed atomics."
+             data_type="uint64"
+             equation="C 7 READ"
+             underscore_name="typed_atomics00"
+             units="messages"
+             symbol_name="TypedAtomics00"
+             availability="$SubsliceMask 1 AND"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="TypedAtomicsPerCacheLine"
+             description="The ratio of EU typed atomics requests to L3 cache line writes."
+             data_type="float"
+             equation="$EuTypedAtomics00 $TypedAtomics00 FDIV"
+             underscore_name="typed_atomics_per_cache_line"
+             units="eu sends to l3 cache lines"
+             symbol_name="TypedAtomicsPerCacheLine"
+             availability="$SubsliceMask 1 AND"
+             semantic_type="ratio"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="Eu 64 Untyped Reads 00"
+             description="Slice0 Dualsubslice 0 Eu 64 Untyped Reads"
+             data_type="float"
+             equation="B 5 READ C 1 READ FADD B 6 READ FADD"
+             underscore_name="eu_a64_untyped_reads00"
+             units="messages"
+             symbol_name="EuA64UntypedReads00"
+             availability="$SubsliceMask 1 AND"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="Eu A32 Untyped Writes 00"
+             description="Slice0 Dualsubslice 0 Eu A32 Untyped Writes"
+             data_type="uint64"
+             equation="B 7 READ B 1 READ UADD"
+             underscore_name="eu_a32_untyped_writes00"
+             units="messages"
+             symbol_name="EuA32UntypedWrites00"
+             availability="$SubsliceMask 1 AND"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="Eu Typed Reads 00"
+             description="Slice0 Dualsubslice 0 Eu Typed Reads"
+             data_type="uint64"
+             equation="B 3 READ"
+             underscore_name="eu_typed_reads00"
+             units="messages"
+             symbol_name="EuTypedReads00"
+             availability="$SubsliceMask 1 AND"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="Eu Typed Writes 00"
+             description="Slice0 Dualsubslice 0 Eu Typed Writes"
+             data_type="uint64"
+             equation="B 4 READ"
+             underscore_name="eu_typed_writes00"
+             units="messages"
+             symbol_name="EuTypedWrites00"
+             availability="$SubsliceMask 1 AND"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="Typed Writes 00"
+             description="Slice 0 Dualsubslice 0 typed writes."
+             data_type="uint64"
+             equation="C 5 READ"
+             underscore_name="typed_writes00"
+             units="messages"
+             symbol_name="TypedWrites00"
+             availability="$SubsliceMask 1 AND"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="TypedWritesPerCacheLine"
+             description="The ratio of EU typed write requests to L3 cache line writes."
+             data_type="float"
+             equation="$EuTypedWrites00 $TypedWrites00 FDIV"
+             underscore_name="typed_writes_per_cache_line"
+             units="eu sends to l3 cache lines"
+             symbol_name="TypedWritesPerCacheLine"
+             availability="$SubsliceMask 1 AND"
+             semantic_type="ratio"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Untyped Writes 00"
+             description="Slice 0 Dualsubslice 0 untyped writes (including SLM writes)."
+             data_type="uint64"
+             equation="C 3 READ"
+             underscore_name="untyped_writes00"
+             units="messages"
+             symbol_name="UntypedWrites00"
+             availability="$SubsliceMask 1 AND"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="Untyped Reads 00"
+             description="Slice 0 Dualsubslice 0 untyped reads (including SLM reads)."
+             data_type="uint64"
+             equation="C 4 READ"
+             underscore_name="untyped_reads00"
+             units="messages"
+             symbol_name="UntypedReads00"
+             availability="$SubsliceMask 1 AND"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="Eu A64 Untyped Writes 00"
+             description="Slice0 Dualsubslice 0 Eu A64 Untyped Writes"
+             data_type="uint64"
+             equation="C 2 READ"
+             underscore_name="eu_a64_untyped_writes00"
+             units="messages"
+             symbol_name="EuA64UntypedWrites00"
+             availability="$SubsliceMask 1 AND"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="UntypedReadsPerCacheLine"
+             description="The ratio of EU untyped read requests to L3 cache line reads."
+             data_type="float"
+             equation="B 0 READ B 5 READ C 1 READ FADD B 6 READ FADD FADD C 4 READ FDIV"
+             underscore_name="untyped_reads_per_cache_line"
+             units="eu sends to l3 cache lines"
+             symbol_name="UntypedReadsPerCacheLine"
+             semantic_type="ratio"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="Typed Reads 00"
+             description="Slice 0 Dualsubslice 0 typed reads."
+             data_type="uint64"
+             equation="C 6 READ"
+             underscore_name="typed_reads00"
+             units="messages"
+             symbol_name="TypedReads00"
+             availability="$SubsliceMask 1 AND"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="TypedReadsPerCacheLine"
+             description="The ratio of EU typed read requests to L3 cache line reads."
+             data_type="float"
+             equation="$EuTypedReads00 $TypedReads00 FDIV"
+             underscore_name="typed_reads_per_cache_line"
+             units="eu sends to l3 cache lines"
+             symbol_name="TypedReadsPerCacheLine"
+             availability="$SubsliceMask 1 AND"
+             semantic_type="ratio"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="Eu A32 Untyped Reads 00"
+             description="Slice 0 Dualsubslice 0 EU A32 untyped reads."
+             data_type="uint64"
+             equation="B 0 READ"
+             underscore_name="eu_a32_untyped_reads00"
+             units="messages"
+             symbol_name="EuA32UntypedReads00"
+             availability="$SubsliceMask 1 AND"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00000D04" value="0x00000200" />
+        <register type="NOA" address="0x00009840" value="0x00000000" />
+        <register type="NOA" address="0x00009884" value="0x00000000" />
+        <register type="NOA" address="0x00009888" value="0x1222000B" />
+        <register type="NOA" address="0x00009888" value="0x16220009" />
+        <register type="NOA" address="0x00009888" value="0x12230019" />
+        <register type="NOA" address="0x00009888" value="0x10230012" />
+        <register type="NOA" address="0x00009888" value="0x101E8000" />
+        <register type="NOA" address="0x00009888" value="0x1A1EF800" />
+        <register type="NOA" address="0x00009888" value="0x1C1E0007" />
+        <register type="NOA" address="0x00009888" value="0x001F8000" />
+        <register type="NOA" address="0x00009888" value="0x0C1FF800" />
+        <register type="NOA" address="0x00009888" value="0x0E1F0007" />
+        <register type="NOA" address="0x00009888" value="0x00204000" />
+        <register type="NOA" address="0x00009888" value="0x0E204000" />
+        <register type="NOA" address="0x00009888" value="0x1A202AA0" />
+        <register type="NOA" address="0x00009888" value="0x1C200005" />
+        <register type="NOA" address="0x00009888" value="0x04208000" />
+        <register type="NOA" address="0x00009888" value="0x06208000" />
+        <register type="NOA" address="0x00009888" value="0x08208000" />
+        <register type="NOA" address="0x00009888" value="0x0A208000" />
+        <register type="NOA" address="0x00009888" value="0x0C208000" />
+        <register type="NOA" address="0x00009888" value="0x00214000" />
+        <register type="NOA" address="0x00009888" value="0x0E214000" />
+        <register type="NOA" address="0x00009888" value="0x14214000" />
+        <register type="NOA" address="0x00009888" value="0x16210555" />
+        <register type="NOA" address="0x00009888" value="0x00220011" />
+        <register type="NOA" address="0x00009888" value="0x06220900" />
+        <register type="NOA" address="0x00009888" value="0x08220A13" />
+        <register type="NOA" address="0x00009888" value="0x0A220B15" />
+        <register type="NOA" address="0x00009888" value="0x0C222317" />
+        <register type="NOA" address="0x00009888" value="0x0E220043" />
+        <register type="NOA" address="0x00009888" value="0x02231AB4" />
+        <register type="NOA" address="0x00009888" value="0x04231DBA" />
+        <register type="NOA" address="0x00009888" value="0x06230039" />
+        <register type="NOA" address="0x00009888" value="0x00230000" />
+        <register type="NOA" address="0x00009888" value="0x0C044400" />
+        <register type="NOA" address="0x00009888" value="0x0E045555" />
+        <register type="NOA" address="0x00009888" value="0x10040055" />
+        <register type="NOA" address="0x00009888" value="0x04051000" />
+        <register type="NOA" address="0x00009888" value="0x0A055000" />
+        <register type="NOA" address="0x00009888" value="0x0C055000" />
+        <register type="NOA" address="0x00009888" value="0x0E055000" />
+        <register type="NOA" address="0x00009888" value="0x14050015" />
+        <register type="NOA" address="0x00009888" value="0x06055000" />
+        <register type="NOA" address="0x00009888" value="0x08055000" />
+        <register type="NOA" address="0x00009888" value="0x2406FD00" />
+        <register type="NOA" address="0x00009888" value="0x2606007F" />
+        <register type="NOA" address="0x00009888" value="0x0015C000" />
+        <register type="NOA" address="0x00009888" value="0x0E15C000" />
+        <register type="NOA" address="0x00009888" value="0x16157FF8" />
+        <register type="NOA" address="0x00009888" value="0x18150003" />
+        <register type="NOA" address="0x00009888" value="0x0415C000" />
+        <register type="NOA" address="0x00009888" value="0x0615C000" />
+        <register type="NOA" address="0x00009888" value="0x0815C000" />
+        <register type="NOA" address="0x00009888" value="0x0A15C000" />
+        <register type="NOA" address="0x00009888" value="0x0C15C000" />
+        <register type="NOA" address="0x00009888" value="0x00182000" />
+        <register type="NOA" address="0x00009888" value="0x0618A000" />
+        <register type="NOA" address="0x00009888" value="0x0818A000" />
+        <register type="NOA" address="0x00009888" value="0x0A18A000" />
+        <register type="NOA" address="0x00009888" value="0x0C18A000" />
+        <register type="NOA" address="0x00009888" value="0x0E182000" />
+        <register type="NOA" address="0x00009888" value="0x0218A000" />
+        <register type="NOA" address="0x00009888" value="0x0418A000" />
+        <register type="NOA" address="0x00009888" value="0x08192000" />
+        <register type="NOA" address="0x00009888" value="0x0E19A000" />
+        <register type="NOA" address="0x00009888" value="0x12195540" />
+        <register type="NOA" address="0x00009888" value="0x1419000A" />
+        <register type="NOA" address="0x00009888" value="0x0A19A000" />
+        <register type="NOA" address="0x00009888" value="0x0C19A000" />
+        <register type="NOA" address="0x00009884" value="0x00000003" />
+        <register type="NOA" address="0x00009888" value="0x16136860" />
+        <register type="NOA" address="0x00009888" value="0x24000004" />
+        <register type="NOA" address="0x00009888" value="0x20000040" />
+        <register type="NOA" address="0x00009888" value="0x0E132980" />
+        <register type="NOA" address="0x00009888" value="0x00132D80" />
+        <register type="NOA" address="0x00009888" value="0x10130000" />
+        <register type="NOA" address="0x00009888" value="0x1A130000" />
+        <register type="NOA" address="0x00009888" value="0x02130000" />
+        <register type="NOA" address="0x00009888" value="0x301F8000" />
+        <register type="NOA" address="0x00009888" value="0x501F4924" />
+        <register type="NOA" address="0x00009888" value="0x521F4924" />
+        <register type="NOA" address="0x00009888" value="0x541F000C" />
+        <register type="NOA" address="0x00009888" value="0x3A1F2000" />
+        <register type="NOA" address="0x00009888" value="0x4E1F2413" />
+        <register type="NOA" address="0x00009888" value="0x3E1F0000" />
+        <register type="NOA" address="0x00009888" value="0x461F0000" />
+        <register type="NOA" address="0x00009888" value="0x481F0000" />
+        <register type="NOA" address="0x00009888" value="0x4A1F0000" />
+        <register type="NOA" address="0x00009888" value="0x4C1F0000" />
+        <register type="NOA" address="0x00009888" value="0x181F0000" />
+        <register type="NOA" address="0x00009888" value="0x401F3013" />
+        <register type="NOA" address="0x00009888" value="0x421F3030" />
+        <register type="NOA" address="0x00009888" value="0x441F3030" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0xF0800000" />
+        <register type="OA" address="0x00002770" value="0x30000036" />
+        <register type="OA" address="0x00002774" value="0x01FFFE00" />
+        <register type="OA" address="0x00002778" value="0x31000034" />
+        <register type="OA" address="0x0000277C" value="0x01FFFE00" />
+        <register type="OA" address="0x00002780" value="0x00000C9A" />
+        <register type="OA" address="0x00002784" value="0x0000FE00" />
+        <register type="OA" address="0x00002788" value="0x00000C92" />
+        <register type="OA" address="0x0000278C" value="0x0000FE00" />
+        <register type="OA" address="0x00002790" value="0x00000CA2" />
+        <register type="OA" address="0x00002794" value="0x0000FE00" />
+        <register type="OA" address="0x00002798" value="0x00000E42" />
+        <register type="OA" address="0x0000279C" value="0x0000FE00" />
+        <register type="OA" address="0x000027A0" value="0x00000E6A" />
+        <register type="OA" address="0x000027A4" value="0x0000FE00" />
+        <register type="OA" address="0x000027A8" value="0x00000C32" />
+        <register type="OA" address="0x000027AC" value="0x0000FE00" />
+        <register type="OA" address="0x0000274C" value="0x87643210" />
+        <register type="OA" address="0x00002744" value="0x00001811" />
+        <register type="OA" address="0x00002748" value="0x87654310" />
+    </register_config>
+  </set>
+
+  <set name="Compute Metrics L3 Cache Gen11"
+       mdapi_supported_apis="VK OGL OCL IO BB"
+       underscore_name="compute_l3_cache"
+       hw_config_guid="05d5e01f-0800-4975-b36b-7b169cad3fab"
+       chipset="ICL"
+       symbol_name="ComputeL3Cache"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 L3 Bank3 Accesses"
+             description="The total number of accesses to Slice0 L3 Bank3."
+             data_type="uint64"
+             equation="C 4 READ 2 UMUL"
+             underscore_name="l3_bank03_accesses"
+             units="messages"
+             symbol_name="L3Bank03Accesses"
+             availability="$SliceMask 1 AND"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="slice"
+             mdapi_group="L3"
+             />
+    <counter name="Slice0 L3 Bank0 Accesses"
+             description="The total number of accesses to Slice0 L3 Bank0."
+             data_type="uint64"
+             equation="C 7 READ 2 UMUL"
+             underscore_name="l3_bank00_accesses"
+             units="messages"
+             symbol_name="L3Bank00Accesses"
+             availability="$SliceMask 1 AND"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="slice"
+             mdapi_group="L3"
+             />
+    <counter name="Slice0 L3 Bank1 Accesses"
+             description="The total number of accesses to Slice0 L3 Bank1."
+             data_type="uint64"
+             equation="C 6 READ 2 UMUL"
+             underscore_name="l3_bank01_accesses"
+             units="messages"
+             symbol_name="L3Bank01Accesses"
+             availability="$SliceMask 1 AND"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="slice"
+             mdapi_group="L3"
+             />
+    <counter name="Slice0 L3 Bank2 Accesses"
+             description="The total number of accesses to Slice0 L3 Bank2."
+             data_type="uint64"
+             equation="C 5 READ 2 UMUL"
+             underscore_name="l3_bank02_accesses"
+             units="messages"
+             symbol_name="L3Bank02Accesses"
+             availability="$SliceMask 1 AND"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="slice"
+             mdapi_group="L3"
+             />
+    <counter name="Slice0 L3 Bank4 Accesses"
+             description="The total number of accesses to Slice0 L3 Bank4."
+             data_type="uint64"
+             equation="C 3 READ 2 UMUL"
+             underscore_name="l3_bank04_accesses"
+             units="messages"
+             symbol_name="L3Bank04Accesses"
+             availability="$SliceMask 1 AND"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="slice"
+             mdapi_group="L3"
+             />
+    <counter name="Slice0 L3 Bank5 Accesses"
+             description="The total number of accesses to Slice0 L3 Bank5."
+             data_type="uint64"
+             equation="C 2 READ 2 UMUL"
+             underscore_name="l3_bank05_accesses"
+             units="messages"
+             symbol_name="L3Bank05Accesses"
+             availability="$SliceMask 1 AND"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="slice"
+             mdapi_group="L3"
+             />
+    <counter name="Slice0 L3 Bank6 Accesses"
+             description="The total number of accesses to Slice0 L3 Bank6."
+             data_type="uint64"
+             equation="C 1 READ 2 UMUL"
+             underscore_name="l3_bank06_accesses"
+             units="messages"
+             symbol_name="L3Bank06Accesses"
+             availability="$SliceMask 1 AND"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="slice"
+             mdapi_group="L3"
+             />
+    <counter name="Slice0 L3 Bank7 Accesses"
+             description="The total number of accesses to Slice0 L3 Bank7."
+             data_type="uint64"
+             equation="C 0 READ 2 UMUL"
+             underscore_name="l3_bank07_accesses"
+             units="messages"
+             symbol_name="L3Bank07Accesses"
+             availability="$SliceMask 1 AND"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="slice"
+             mdapi_group="L3"
+             />
+    <counter name="L3 Accesses"
+             description="The total number of L3 accesses from all entities."
+             data_type="uint64"
+             equation="$L3Bank00Accesses $L3Bank01Accesses UADD $L3Bank02Accesses UADD $L3Bank03Accesses UADD $L3Bank04Accesses UADD $L3Bank05Accesses UADD $L3Bank06Accesses UADD $L3Bank07Accesses UADD"
+             underscore_name="l3_accesses"
+             units="messages"
+             symbol_name="L3Accesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Sampler Throughput"
+             description="The total number of GPU memory bytes transferred between samplers and L3 caches."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="64  B 7 READ B 6 READ UADD 2 UMUL UMUL"
+             underscore_name="l3_sampler_throughput"
+             units="bytes"
+             symbol_name="L3SamplerThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Sampler"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU AVG IPC Rate"
+             description="The average rate of IPC calculated for 2 FPU pipelines."
+             data_type="float"
+             max_equation="2"
+             equation="A 9 READ A 10 READ A 11 READ FADD A 9 READ FSUB FDIV 1 FADD"
+             underscore_name="eu_avg_ipc_rate"
+             units="number"
+             symbol_name="EuAvgIpcRate"
+             semantic_type="ratio"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU0 Binary Instruction"
+             description="The percentage of time in which execution units were actively processing binary instructions on FPU0."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_binary_fpu0_instruction"
+             units="percent"
+             symbol_name="EuBinaryFpu0Instruction"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes/Instructions"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="EU FPU0 Hybrid Instruction"
+             description="The percentage of time in which execution units were actively processing hybrid instructions on FPU0."
+             data_type="float"
+             max_equation="100"
+             equation="A 13 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_hybrid_fpu0_instruction"
+             units="percent"
+             symbol_name="EuHybridFpu0Instruction"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="EU Array/Pipes/Instructions"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="fpu1_active"
+             units="percent"
+             symbol_name="Fpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="fpu0_active"
+             units="percent"
+             symbol_name="Fpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="EU FPU0 Move Instruction"
+             description="The percentage of time in which execution units were actively processing move instructions on FPU0."
+             data_type="float"
+             max_equation="100"
+             equation="A 19 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_move_fpu0_instruction"
+             units="percent"
+             symbol_name="EuMoveFpu0Instruction"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes/Instructions"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Accesses"
+             description="The total number of messages sent to samplers."
+             data_type="uint64"
+             equation="A 28 READ"
+             underscore_name="sampler_accesses"
+             units="messages"
+             symbol_name="SamplerAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="$SamplerAccesses 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU FPU1 Hybrid Instruction"
+             description="The percentage of time in which execution units were actively processing hybrid instructions on FPU1."
+             data_type="float"
+             max_equation="100"
+             equation="A 14 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_hybrid_fpu1_instruction"
+             units="percent"
+             symbol_name="EuHybridFpu1Instruction"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="EU Array/Pipes/Instructions"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texel lookups (with 2x2 accuracy) that missed the L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="L3 Lookup Accesses w/o IC"
+             description="The total number of L3 cache lookup accesses w/o IC."
+             data_type="uint64"
+             equation="B 7 READ B 6 READ UADD 2 UMUL A 32 READ UADD"
+             underscore_name="l3_lookups"
+             units="messages"
+             symbol_name="L3Lookups"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/TAG"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GTI Read Throughput"
+             description="The total number of GPU memory bytes read from GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL"
+             equation="B 2 READ 64 UMUL"
+             underscore_name="gti_read_throughput"
+             units="bytes"
+             symbol_name="GtiReadThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU0 Ternary Instruction"
+             description="The percentage of time in which execution units were actively processing ternary instructions on FPU0."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_ternary_fpu0_instruction"
+             units="percent"
+             symbol_name="EuTernaryFpu0Instruction"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes/Instructions"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU FPU1 Move Instruction"
+             description="The percentage of time in which execution units were actively processing move instructions on FPU1."
+             data_type="float"
+             max_equation="100"
+             equation="A 20 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_move_fpu1_instruction"
+             units="percent"
+             symbol_name="EuMoveFpu1Instruction"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes/Instructions"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="L3 Total Throughput"
+             description="The total number of GPU memory bytes transferred via L3."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="$L3Accesses 64 UMUL"
+             underscore_name="l3_total_throughput"
+             units="bytes"
+             symbol_name="L3TotalThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GTI Write Throughput"
+             description="The total number of GPU memory bytes written to GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL"
+             equation="B 3 READ 64 UMUL"
+             underscore_name="gti_write_throughput"
+             units="bytes"
+             symbol_name="GtiWriteThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="$ShaderMemoryAccesses 64 UMUL"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU1 Binary Instruction"
+             description="The percentage of time in which execution units were actively processing binary instructions on FPU1."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_binary_fpu1_instruction"
+             units="percent"
+             symbol_name="EuBinaryFpu1Instruction"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes/Instructions"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU1 Ternary Instruction"
+             description="The percentage of time in which execution units were actively processing ternary instructions on FPU1."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_ternary_fpu1_instruction"
+             units="percent"
+             symbol_name="EuTernaryFpu1Instruction"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes/Instructions"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_send_active"
+             units="percent"
+             symbol_name="EuSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00000D04" value="0x00000200" />
+        <register type="NOA" address="0x00009840" value="0x00000000" />
+        <register type="NOA" address="0x00009884" value="0x00000000" />
+        <register type="NOA" address="0x00009888" value="0x14120700" />
+        <register type="NOA" address="0x00009888" value="0x121500E0" />
+        <register type="NOA" address="0x00009888" value="0x10040154" />
+        <register type="NOA" address="0x00009888" value="0x0C045000" />
+        <register type="NOA" address="0x00009888" value="0x0E040055" />
+        <register type="NOA" address="0x00009888" value="0x14050055" />
+        <register type="NOA" address="0x00009888" value="0x04054000" />
+        <register type="NOA" address="0x00009888" value="0x06055000" />
+        <register type="NOA" address="0x00009888" value="0x08055000" />
+        <register type="NOA" address="0x00009888" value="0x0A051000" />
+        <register type="NOA" address="0x00009888" value="0x260600F0" />
+        <register type="NOA" address="0x00009888" value="0x24067E00" />
+        <register type="NOA" address="0x00009888" value="0x0C120023" />
+        <register type="NOA" address="0x00009888" value="0x0E12152B" />
+        <register type="NOA" address="0x00009888" value="0x00121480" />
+        <register type="NOA" address="0x00009888" value="0x02120028" />
+        <register type="NOA" address="0x00009888" value="0x10120000" />
+        <register type="NOA" address="0x00009888" value="0x18120000" />
+        <register type="NOA" address="0x00009888" value="0x1A120000" />
+        <register type="NOA" address="0x00009888" value="0x04120000" />
+        <register type="NOA" address="0x00009888" value="0x0A13D000" />
+        <register type="NOA" address="0x00009888" value="0x04136000" />
+        <register type="NOA" address="0x00009888" value="0x0C144000" />
+        <register type="NOA" address="0x00009888" value="0x0E14C000" />
+        <register type="NOA" address="0x00009888" value="0x00148000" />
+        <register type="NOA" address="0x00009888" value="0x02144000" />
+        <register type="NOA" address="0x00009888" value="0x0C150980" />
+        <register type="NOA" address="0x00009888" value="0x02154D80" />
+        <register type="NOA" address="0x00009888" value="0x04154C9A" />
+        <register type="NOA" address="0x00009888" value="0x06150018" />
+        <register type="NOA" address="0x00009888" value="0x10150000" />
+        <register type="NOA" address="0x00009888" value="0x16150800" />
+        <register type="NOA" address="0x00009888" value="0x18150005" />
+        <register type="NOA" address="0x00009888" value="0x08150000" />
+        <register type="NOA" address="0x00009888" value="0x0A150000" />
+        <register type="NOA" address="0x00009884" value="0x00000003" />
+        <register type="NOA" address="0x00009888" value="0x1217241C" />
+        <register type="NOA" address="0x00009888" value="0x22000050" />
+        <register type="NOA" address="0x00009888" value="0x18133C00" />
+        <register type="NOA" address="0x00009888" value="0x081710B0" />
+        <register type="NOA" address="0x00009888" value="0x10170000" />
+        <register type="NOA" address="0x00009888" value="0x501F1124" />
+        <register type="NOA" address="0x00009888" value="0x521F4801" />
+        <register type="NOA" address="0x00009888" value="0x541F0024" />
+        <register type="NOA" address="0x00009888" value="0x3A1F8000" />
+        <register type="NOA" address="0x00009888" value="0x4E1F2400" />
+        <register type="NOA" address="0x00009888" value="0x461F3100" />
+        <register type="NOA" address="0x00009888" value="0x481F0031" />
+        <register type="NOA" address="0x00009888" value="0x4A1F0000" />
+        <register type="NOA" address="0x00009888" value="0x4C1F0030" />
+        <register type="NOA" address="0x00009888" value="0x181F0000" />
+        <register type="NOA" address="0x00009888" value="0x301F0000" />
+        <register type="NOA" address="0x00009888" value="0x401F0000" />
+        <register type="NOA" address="0x00009888" value="0x421F3030" />
+        <register type="NOA" address="0x00009888" value="0x441F3030" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x00800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00000003" />
+        <register type="FLEX" address="0x0000E658" value="0x00002001" />
+        <register type="FLEX" address="0x0000E758" value="0x00101100" />
+        <register type="FLEX" address="0x0000E45C" value="0x00201200" />
+        <register type="FLEX" address="0x0000E55C" value="0x00301300" />
+        <register type="FLEX" address="0x0000E65C" value="0x00401400" />
+    </register_config>
+  </set>
+
+  <set name="Render Metrics for 3D Pipeline Profile Gen11"
+       mdapi_supported_apis="VK OGL OCL IO BB"
+       underscore_name="render_pipe_profile"
+       hw_config_guid="03c7a167-2abc-4ba6-878a-f1d80082abca"
+       chipset="ICL"
+       symbol_name="RenderPipeProfile"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Bottleneck"
+             low_watermark="10"
+             description="The percentage of time in which vertex shader pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="30"
+             equation="C 6 READ 100 UMUL $GpuCoreClocks FDIV"
+             max_equation="100"
+             underscore_name="vs_bottleneck"
+             units="percent"
+             symbol_name="VsBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Hi-Depth Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which early hierarchical depth test pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="15"
+             equation="B 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             max_equation="100"
+             underscore_name="hi_depth_bottleneck"
+             units="percent"
+             symbol_name="HiDepthBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which geometry shader pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="15"
+             equation="C 3 READ 100 UMUL $GpuCoreClocks FDIV"
+             max_equation="100"
+             underscore_name="gs_bottleneck"
+             units="percent"
+             symbol_name="GsBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Geometry Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="BC Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which barycentric coordinates calculation pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="15"
+             equation="B 5 READ 100 UMUL $GpuCoreClocks FDIV"
+             max_equation="100"
+             underscore_name="bc_bottleneck"
+             units="percent"
+             symbol_name="BcBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Rasterizer/Barycentric Calc"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="HS Stall"
+             description="The percentage of time in which hull shader pipeline stage was stalled."
+             data_type="float"
+             max_equation="100"
+             equation="B 4 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="hs_stall"
+             units="percent"
+             symbol_name="HsStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Correlate Draw"
+             mdapi_group="3D Pipe/Hull Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texel lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="VF Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which vertex fetch pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="15"
+             equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             max_equation="100"
+             underscore_name="vf_bottleneck"
+             units="percent"
+             symbol_name="VfBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Input Assembler"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Strip-Fans Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which strip-fans pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="10"
+             equation="C 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             max_equation="100"
+             underscore_name="sf_bottleneck"
+             units="percent"
+             symbol_name="SfBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Rasterizer/Strip-Fans"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SF Stall"
+             description="The percentage of time in which strip-fans pipeline stage was stalled."
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sf_stall"
+             units="percent"
+             symbol_name="SfStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Correlate Draw"
+             mdapi_group="3D Pipe/Rasterizer/Strip-Fans"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="HS Bottleneck"
+             low_watermark="3"
+             description="The percentage of time in which hull shader pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="9"
+             equation="C 5 READ 100 UMUL $GpuCoreClocks FDIV"
+             max_equation="100"
+             underscore_name="hs_bottleneck"
+             units="percent"
+             symbol_name="HsBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Hull Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="CL Stall"
+             description="The percentage of time in which clipper pipeline stage was stalled."
+             data_type="float"
+             max_equation="100"
+             equation="B 1 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="cl_stall"
+             units="percent"
+             symbol_name="ClStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Correlate Draw"
+             mdapi_group="3D Pipe/Clipper"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SO Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which stream output pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="15"
+             equation="C 2 READ 100 UMUL $GpuCoreClocks FDIV"
+             max_equation="100"
+             underscore_name="so_bottleneck"
+             units="percent"
+             symbol_name="SoBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Stream Output"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="DS Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which domain shader pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="15"
+             equation="C 4 READ 100 UMUL $GpuCoreClocks FDIV"
+             max_equation="100"
+             underscore_name="ds_bottleneck"
+             units="percent"
+             symbol_name="DsBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Domain Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Clipper Bottleneck"
+             low_watermark="10"
+             description="The percentage of time in which clipper pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="30"
+             equation="C 1 READ 100 UMUL $GpuCoreClocks FDIV"
+             max_equation="100"
+             underscore_name="cl_bottleneck"
+             units="percent"
+             symbol_name="ClBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Clipper"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Stall"
+             description="The percentage of time in which domain shader pipeline stage was stalled."
+             data_type="float"
+             max_equation="100"
+             equation="B 3 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ds_stall"
+             units="percent"
+             symbol_name="DsStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Correlate Draw"
+             mdapi_group="3D Pipe/Domain Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Early Depth Bottleneck"
+             low_watermark="10"
+             description="The percentage of time in which early depth test pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="30"
+             equation="B 6 READ 100 UMUL $GpuCoreClocks FDIV"
+             max_equation="100"
+             underscore_name="early_depth_bottleneck"
+             units="percent"
+             symbol_name="EarlyDepthBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="$ShaderMemoryAccesses 64 UMUL"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SO Stall"
+             description="The percentage of time in which stream-output pipeline stage was stalled."
+             data_type="float"
+             max_equation="100"
+             equation="B 2 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="so_stall"
+             units="percent"
+             symbol_name="SoStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Correlate Draw"
+             mdapi_group="3D Pipe/Stream Output"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00000D04" value="0x00000200" />
+        <register type="NOA" address="0x00009840" value="0x00000000" />
+        <register type="NOA" address="0x00009884" value="0x00000000" />
+        <register type="NOA" address="0x00009888" value="0x001F001E" />
+        <register type="NOA" address="0x00009888" value="0x10160000" />
+        <register type="NOA" address="0x00009888" value="0x1017001F" />
+        <register type="NOA" address="0x00009888" value="0x0A1F0005" />
+        <register type="NOA" address="0x00009888" value="0x0E1F0000" />
+        <register type="NOA" address="0x00009888" value="0x0C1F0000" />
+        <register type="NOA" address="0x00009888" value="0x1A200800" />
+        <register type="NOA" address="0x00009888" value="0x10040015" />
+        <register type="NOA" address="0x00009888" value="0x0E054000" />
+        <register type="NOA" address="0x00009888" value="0x14050005" />
+        <register type="NOA" address="0x00009888" value="0x26060038" />
+        <register type="NOA" address="0x00009888" value="0x16157E00" />
+        <register type="NOA" address="0x00009888" value="0x0C160022" />
+        <register type="NOA" address="0x00009888" value="0x08160000" />
+        <register type="NOA" address="0x00009888" value="0x0C170540" />
+        <register type="NOA" address="0x00009888" value="0x04170000" />
+        <register type="NOA" address="0x00009888" value="0x0A188000" />
+        <register type="NOA" address="0x00009888" value="0x0C181000" />
+        <register type="NOA" address="0x00009888" value="0x12195000" />
+        <register type="NOA" address="0x00009888" value="0x14190001" />
+        <register type="NOA" address="0x00009884" value="0x00000003" />
+        <register type="NOA" address="0x00009888" value="0x12010000" />
+        <register type="NOA" address="0x00009888" value="0x100B7C00" />
+        <register type="NOA" address="0x00009888" value="0x100F0019" />
+        <register type="NOA" address="0x00009888" value="0x10107C00" />
+        <register type="NOA" address="0x00009888" value="0x16100000" />
+        <register type="NOA" address="0x00009888" value="0x00110000" />
+        <register type="NOA" address="0x00009888" value="0x120703C0" />
+        <register type="NOA" address="0x00009888" value="0x10090000" />
+        <register type="NOA" address="0x00009888" value="0x06010080" />
+        <register type="NOA" address="0x00009888" value="0x0E014180" />
+        <register type="NOA" address="0x00009888" value="0x10010000" />
+        <register type="NOA" address="0x00009888" value="0x00014000" />
+        <register type="NOA" address="0x00009888" value="0x060B0015" />
+        <register type="NOA" address="0x00009888" value="0x080B8000" />
+        <register type="NOA" address="0x00009888" value="0x0A0B2000" />
+        <register type="NOA" address="0x00009888" value="0x020BA000" />
+        <register type="NOA" address="0x00009888" value="0x040BA000" />
+        <register type="NOA" address="0x00009888" value="0x0E0E0A02" />
+        <register type="NOA" address="0x00009888" value="0x0C0EA800" />
+        <register type="NOA" address="0x00009888" value="0x020F0002" />
+        <register type="NOA" address="0x00009888" value="0x180F0800" />
+        <register type="NOA" address="0x00009888" value="0x040F0000" />
+        <register type="NOA" address="0x00009888" value="0x060F8000" />
+        <register type="NOA" address="0x00009888" value="0x0A100017" />
+        <register type="NOA" address="0x00009888" value="0x04107113" />
+        <register type="NOA" address="0x00009888" value="0x18100020" />
+        <register type="NOA" address="0x00009888" value="0x06104000" />
+        <register type="NOA" address="0x00009888" value="0x08100000" />
+        <register type="NOA" address="0x00009888" value="0x08110C40" />
+        <register type="NOA" address="0x00009888" value="0x02110C80" />
+        <register type="NOA" address="0x00009888" value="0x00024000" />
+        <register type="NOA" address="0x00009888" value="0x06028000" />
+        <register type="NOA" address="0x00009888" value="0x0E02C000" />
+        <register type="NOA" address="0x00009888" value="0x00039000" />
+        <register type="NOA" address="0x00009888" value="0x06036000" />
+        <register type="NOA" address="0x00009888" value="0x0803A000" />
+        <register type="NOA" address="0x00009888" value="0x0A032000" />
+        <register type="NOA" address="0x00009888" value="0x0E035000" />
+        <register type="NOA" address="0x00009888" value="0x0203A000" />
+        <register type="NOA" address="0x00009888" value="0x0403A000" />
+        <register type="NOA" address="0x00009888" value="0x00044000" />
+        <register type="NOA" address="0x00009888" value="0x0E044000" />
+        <register type="NOA" address="0x00009888" value="0x10068000" />
+        <register type="NOA" address="0x00009888" value="0x12068000" />
+        <register type="NOA" address="0x00009888" value="0x14068000" />
+        <register type="NOA" address="0x00009888" value="0x02068000" />
+        <register type="NOA" address="0x00009888" value="0x04068000" />
+        <register type="NOA" address="0x00009888" value="0x06068000" />
+        <register type="NOA" address="0x00009888" value="0x08068000" />
+        <register type="NOA" address="0x00009888" value="0x0A068000" />
+        <register type="NOA" address="0x00009888" value="0x0C068000" />
+        <register type="NOA" address="0x00009888" value="0x00070032" />
+        <register type="NOA" address="0x00009888" value="0x0E070033" />
+        <register type="NOA" address="0x00009888" value="0x04070000" />
+        <register type="NOA" address="0x00009888" value="0x08098011" />
+        <register type="NOA" address="0x00009888" value="0x00090980" />
+        <register type="NOA" address="0x00009888" value="0x18090A00" />
+        <register type="NOA" address="0x00009888" value="0x02090000" />
+        <register type="NOA" address="0x00009888" value="0x04098000" />
+        <register type="NOA" address="0x00009888" value="0x06098000" />
+        <register type="NOA" address="0x00009888" value="0x0A098000" />
+        <register type="NOA" address="0x00009888" value="0x0C098000" />
+        <register type="NOA" address="0x00009888" value="0x301F6000" />
+        <register type="NOA" address="0x00009888" value="0x501F36DB" />
+        <register type="NOA" address="0x00009888" value="0x521F491B" />
+        <register type="NOA" address="0x00009888" value="0x541F001B" />
+        <register type="NOA" address="0x00009888" value="0x3A1F6000" />
+        <register type="NOA" address="0x00009888" value="0x4E1F1B41" />
+        <register type="NOA" address="0x00009888" value="0x3E1F2100" />
+        <register type="NOA" address="0x00009888" value="0x461F4141" />
+        <register type="NOA" address="0x00009888" value="0x481F1160" />
+        <register type="NOA" address="0x00009888" value="0x4A1F1000" />
+        <register type="NOA" address="0x00009888" value="0x4C1F2120" />
+        <register type="NOA" address="0x00009888" value="0x181F0000" />
+        <register type="NOA" address="0x00009888" value="0x401F0141" />
+        <register type="NOA" address="0x00009888" value="0x421F1160" />
+        <register type="NOA" address="0x00009888" value="0x441F3111" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x00800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+    </register_config>
+  </set>
+
+  <set name="Metric set HDCAndSF"
+       mdapi_supported_apis="VK OGL OCL IO BB"
+       underscore_name="hdc_and_sf"
+       hw_config_guid="c5cbc488-6569-41dd-9128-42bf6f0d317c"
+       chipset="ICL"
+       symbol_name="HDCAndSF"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SQ is full"
+             description="The percentage of time when SQ is filled above a threshold (usually 48 entries)"
+             data_type="float"
+             max_equation="100"
+             equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gt_request_queue_full"
+             units="percent"
+             symbol_name="GTRequestQueueFull"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on the both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="Polygon Data Ready"
+             description="The percentage of time in which geometry pipeline output is ready"
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="poly_data_ready"
+             units="percent"
+             symbol_name="PolyDataReady"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/3D Pipe/Strip-Fans"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="Slice0 Dualsubslice1 Non-sampler Shader Access Stalled On L3"
+             description="Percentage of time when HDC has messages to L3, but it's stalled due to lack of credits (Slice0 Dualsubslice1)"
+             data_type="float"
+             max_equation="100"
+             equation="C 2 READ C 1 READ FSUB 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="non_sampler_shader01_access_stalled_on_l3"
+             units="percent"
+             symbol_name="NonSamplerShader01AccessStalledOnL3"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="GPU/Data Port"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="Slice0 Dualsubslice2 Non-sampler Shader Access Stalled On L3"
+             description="Percentage of time when HDC has messages to L3, but it's stalled due to lack of credits (Slice0 Dualsubslice2)"
+             data_type="float"
+             max_equation="100"
+             equation="C 4 READ C 3 READ FSUB 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="non_sampler_shader02_access_stalled_on_l3"
+             units="percent"
+             symbol_name="NonSamplerShader02AccessStalledOnL3"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="GPU/Data Port"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="$ShaderMemoryAccesses 64 UMUL"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="Slice0 Dualsubslice0 Non-sampler Shader Access Stalled On L3"
+             description="Percentage of time when HDC has messages to L3, but it's stalled due to lack of credits (Slice0 Dualsubslice0)"
+             data_type="float"
+             max_equation="100"
+             equation="C 0 READ B 7 READ FSUB 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="non_sampler_shader00_access_stalled_on_l3"
+             units="percent"
+             symbol_name="NonSamplerShader00AccessStalledOnL3"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="GPU/Data Port"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 Dualsubslice3 Non-sampler Shader Access Stalled On L3"
+             description="Percentage of time when HDC has messages to L3, but it's stalled due to lack of credits (Slice0 Dualsubslice3)"
+             data_type="float"
+             max_equation="100"
+             equation="C 6 READ C 5 READ FSUB 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="non_sampler_shader03_access_stalled_on_l3"
+             units="percent"
+             symbol_name="NonSamplerShader03AccessStalledOnL3"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="GPU/Data Port"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00000D04" value="0x00000200" />
+        <register type="NOA" address="0x00009840" value="0x00000000" />
+        <register type="NOA" address="0x00009884" value="0x00000000" />
+        <register type="NOA" address="0x00009888" value="0x1223000A" />
+        <register type="NOA" address="0x00009888" value="0x10230009" />
+        <register type="NOA" address="0x00009888" value="0x1263000A" />
+        <register type="NOA" address="0x00009888" value="0x10630009" />
+        <register type="NOA" address="0x00009888" value="0x12A3000A" />
+        <register type="NOA" address="0x00009888" value="0x10A30009" />
+        <register type="NOA" address="0x00009888" value="0x12E3000A" />
+        <register type="NOA" address="0x00009888" value="0x10E30009" />
+        <register type="NOA" address="0x00009888" value="0x10150019" />
+        <register type="NOA" address="0x00009888" value="0x1C20000A" />
+        <register type="NOA" address="0x00009888" value="0x0C231900" />
+        <register type="NOA" address="0x00009888" value="0x0E23003C" />
+        <register type="NOA" address="0x00009888" value="0x00230000" />
+        <register type="NOA" address="0x00009888" value="0x1C600020" />
+        <register type="NOA" address="0x00009888" value="0x02608000" />
+        <register type="NOA" address="0x00009888" value="0x0E631900" />
+        <register type="NOA" address="0x00009888" value="0x00631E00" />
+        <register type="NOA" address="0x00009888" value="0x04A08000" />
+        <register type="NOA" address="0x00009888" value="0x06A08000" />
+        <register type="NOA" address="0x00009888" value="0x02A31E32" />
+        <register type="NOA" address="0x00009888" value="0x00A30000" />
+        <register type="NOA" address="0x00009888" value="0x08E08000" />
+        <register type="NOA" address="0x00009888" value="0x0AE08000" />
+        <register type="NOA" address="0x00009888" value="0x04E31E32" />
+        <register type="NOA" address="0x00009888" value="0x00E30000" />
+        <register type="NOA" address="0x00009888" value="0x0C045400" />
+        <register type="NOA" address="0x00009888" value="0x10040150" />
+        <register type="NOA" address="0x00009888" value="0x0E040015" />
+        <register type="NOA" address="0x00009888" value="0x04055000" />
+        <register type="NOA" address="0x00009888" value="0x14050054" />
+        <register type="NOA" address="0x00009888" value="0x06055000" />
+        <register type="NOA" address="0x00009888" value="0x08055000" />
+        <register type="NOA" address="0x00009888" value="0x24063F00" />
+        <register type="NOA" address="0x00009888" value="0x260600E0" />
+        <register type="NOA" address="0x00009888" value="0x0E088000" />
+        <register type="NOA" address="0x00009888" value="0x00088000" />
+        <register type="NOA" address="0x00009888" value="0x14090040" />
+        <register type="NOA" address="0x00009888" value="0x04094000" />
+        <register type="NOA" address="0x00009888" value="0x040DA000" />
+        <register type="NOA" address="0x00009888" value="0x080E5000" />
+        <register type="NOA" address="0x00009888" value="0x1A120020" />
+        <register type="NOA" address="0x00009888" value="0x02128000" />
+        <register type="NOA" address="0x00009888" value="0x0412C000" />
+        <register type="NOA" address="0x00009888" value="0x0612C000" />
+        <register type="NOA" address="0x00009888" value="0x0A138000" />
+        <register type="NOA" address="0x00009888" value="0x0413E000" />
+        <register type="NOA" address="0x00009888" value="0x0E148000" />
+        <register type="NOA" address="0x00009888" value="0x00148000" />
+        <register type="NOA" address="0x00009888" value="0x0214C000" />
+        <register type="NOA" address="0x00009888" value="0x00150047" />
+        <register type="NOA" address="0x00009888" value="0x16156000" />
+        <register type="NOA" address="0x00009888" value="0x18150007" />
+        <register type="NOA" address="0x00009888" value="0x02154000" />
+        <register type="NOA" address="0x00009888" value="0x04154000" />
+        <register type="NOA" address="0x00009888" value="0x06154000" />
+        <register type="NOA" address="0x00009888" value="0x08158000" />
+        <register type="NOA" address="0x00009888" value="0x0A158000" />
+        <register type="NOA" address="0x00009888" value="0x0C188000" />
+        <register type="NOA" address="0x00009888" value="0x0E182000" />
+        <register type="NOA" address="0x00009888" value="0x1419000A" />
+        <register type="NOA" address="0x00009888" value="0x021CA000" />
+        <register type="NOA" address="0x00009888" value="0x0A1DA000" />
+        <register type="NOA" address="0x00009884" value="0x00000003" />
+        <register type="NOA" address="0x00009888" value="0x1C1F3061" />
+        <register type="NOA" address="0x00009888" value="0x181F0000" />
+        <register type="NOA" address="0x00009888" value="0x301F8000" />
+        <register type="NOA" address="0x00009888" value="0x521F4000" />
+        <register type="NOA" address="0x00009888" value="0x541F0024" />
+        <register type="NOA" address="0x00009888" value="0x3A1F8000" />
+        <register type="NOA" address="0x00009888" value="0x4E1F2400" />
+        <register type="NOA" address="0x00009888" value="0x501F0024" />
+        <register type="NOA" address="0x00009888" value="0x3E1F0100" />
+        <register type="NOA" address="0x00009888" value="0x4C1F3030" />
+        <register type="NOA" address="0x00009888" value="0x401F0000" />
+        <register type="NOA" address="0x00009888" value="0x421F3000" />
+        <register type="NOA" address="0x00009888" value="0x441F3330" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x10800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+        <register type="OA" address="0x00002770" value="0x00000002" />
+        <register type="OA" address="0x00002774" value="0x0000FFFE" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+    </register_config>
+  </set>
+
+  <set name="Metric set RasterizerAndPixelBackend"
+       mdapi_supported_apis="VK OGL OCL IO BB"
+       underscore_name="rasterizer_and_pixel_backend"
+       hw_config_guid="0316ce4f-e03f-4738-8262-13528fce8eea"
+       chipset="ICL"
+       symbol_name="RasterizerAndPixelBackend"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SQ is full"
+             description="The percentage of time when SQ is filled above a threshold (usually 48 entries)"
+             data_type="float"
+             max_equation="100"
+             equation="C 6 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gt_request_queue_full"
+             units="percent"
+             symbol_name="GTRequestQueueFull"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 Pipe0 PS Output Available"
+             description="The percentage of time in which slice0 pipe0 PS output is available"
+             data_type="float"
+             max_equation="100"
+             equation="C 4 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_output00_available"
+             units="percent"
+             symbol_name="PSOutput00Available"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/3D Pipe"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Slice0 Pipe1 PS Output Available"
+             description="The percentage of time in which slice0 pipe1 PS output is available"
+             data_type="float"
+             max_equation="100"
+             equation="C 5 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_output01_available"
+             units="percent"
+             symbol_name="PSOutput01Available"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/3D Pipe"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Slice0 Pipe1 Pixel Values Ready"
+             description="The percentage of time in which slice0 pipe1 pixel values are ready"
+             data_type="float"
+             max_equation="100"
+             equation="C 3 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="pixel_values01_ready"
+             units="percent"
+             symbol_name="PixelValues01Ready"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/3D Pipe"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Slice0 Pipe0 Post-EarlyZ Pixel Data Ready"
+             description="The percentage of time in which slice0 pipe0 post-EarlyZ pixel data is ready (after early Z tests have been applied)"
+             data_type="float"
+             max_equation="100"
+             equation="B 1 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="pixel_data00_ready"
+             units="percent"
+             symbol_name="PixelData00Ready"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Rasterizer/Early Depth Test"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texel lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="Slice0 Pipe1 Post-EarlyZ Pixel Data Ready"
+             description="The percentage of time in which slice0 pipe1 post-EarlyZ pixel data is ready (after early Z tests have been applied)"
+             data_type="float"
+             max_equation="100"
+             equation="B 2 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="pixel_data01_ready"
+             units="percent"
+             symbol_name="PixelData01Ready"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Rasterizer/Early Depth Test"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="Slice0 Rasterizer Input Available"
+             description="The percentage of time in which slice0 rasterizer input is available"
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="rasterizer0_input_available"
+             units="percent"
+             symbol_name="Rasterizer0InputAvailable"
+             availability="$SliceMask 1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Rasterizer"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="Slice0 Pipe0 Pixel Values Ready"
+             description="The percentage of time in which slice0 pipe0 pixel values are ready"
+             data_type="float"
+             max_equation="100"
+             equation="C 2 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="pixel_values00_ready"
+             units="percent"
+             symbol_name="PixelValues00Ready"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/3D Pipe"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 Rasterizer Output Ready"
+             description="The percentage of time in which slice0 rasterizer output is ready"
+             data_type="float"
+             max_equation="100"
+             equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="rasterizer0_output_ready"
+             units="percent"
+             symbol_name="Rasterizer0OutputReady"
+             availability="$SliceMask 1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Rasterizer"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="$ShaderMemoryAccesses 64 UMUL"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00000D04" value="0x00000200" />
+        <register type="NOA" address="0x00009840" value="0x00000000" />
+        <register type="NOA" address="0x00009884" value="0x00000000" />
+        <register type="NOA" address="0x00009888" value="0x140A001F" />
+        <register type="NOA" address="0x00009888" value="0x040C5000" />
+        <register type="NOA" address="0x00009888" value="0x140F001F" />
+        <register type="NOA" address="0x00009888" value="0x04115017" />
+        <register type="NOA" address="0x00009888" value="0x10136000" />
+        <register type="NOA" address="0x00009888" value="0x1213001C" />
+        <register type="NOA" address="0x00009888" value="0x16140000" />
+        <register type="NOA" address="0x00009888" value="0x10160018" />
+        <register type="NOA" address="0x00009888" value="0x101A0018" />
+        <register type="NOA" address="0x00009888" value="0x0C045400" />
+        <register type="NOA" address="0x00009888" value="0x0E045545" />
+        <register type="NOA" address="0x00009888" value="0x04055000" />
+        <register type="NOA" address="0x00009888" value="0x0A055000" />
+        <register type="NOA" address="0x00009888" value="0x0C055000" />
+        <register type="NOA" address="0x00009888" value="0x0E051000" />
+        <register type="NOA" address="0x00009888" value="0x06055000" />
+        <register type="NOA" address="0x00009888" value="0x08051000" />
+        <register type="NOA" address="0x00009888" value="0x2406DF00" />
+        <register type="NOA" address="0x00009888" value="0x26060007" />
+        <register type="NOA" address="0x00009888" value="0x00084000" />
+        <register type="NOA" address="0x00009888" value="0x02084000" />
+        <register type="NOA" address="0x00009888" value="0x04094000" />
+        <register type="NOA" address="0x00009888" value="0x06094000" />
+        <register type="NOA" address="0x00009888" value="0x000A3080" />
+        <register type="NOA" address="0x00009888" value="0x160A0000" />
+        <register type="NOA" address="0x00009888" value="0x080A0000" />
+        <register type="NOA" address="0x00009888" value="0x0A0A8000" />
+        <register type="NOA" address="0x00009888" value="0x020C05C0" />
+        <register type="NOA" address="0x00009888" value="0x080C0000" />
+        <register type="NOA" address="0x00009888" value="0x020D1000" />
+        <register type="NOA" address="0x00009888" value="0x040D1000" />
+        <register type="NOA" address="0x00009888" value="0x060E1000" />
+        <register type="NOA" address="0x00009888" value="0x080E1000" />
+        <register type="NOA" address="0x00009888" value="0x020F0061" />
+        <register type="NOA" address="0x00009888" value="0x160F0000" />
+        <register type="NOA" address="0x00009888" value="0x0A0F0000" />
+        <register type="NOA" address="0x00009888" value="0x0C0F4000" />
+        <register type="NOA" address="0x00009888" value="0x08110000" />
+        <register type="NOA" address="0x00009888" value="0x18120C00" />
+        <register type="NOA" address="0x00009888" value="0x02128000" />
+        <register type="NOA" address="0x00009888" value="0x06128000" />
+        <register type="NOA" address="0x00009888" value="0x0613092F" />
+        <register type="NOA" address="0x00009888" value="0x08134025" />
+        <register type="NOA" address="0x00009888" value="0x0C130000" />
+        <register type="NOA" address="0x00009888" value="0x0413A000" />
+        <register type="NOA" address="0x00009888" value="0x00148066" />
+        <register type="NOA" address="0x00009888" value="0x10140000" />
+        <register type="NOA" address="0x00009888" value="0x0614C000" />
+        <register type="NOA" address="0x00009888" value="0x08144000" />
+        <register type="NOA" address="0x00009888" value="0x0A144000" />
+        <register type="NOA" address="0x00009888" value="0x02148000" />
+        <register type="NOA" address="0x00009888" value="0x00154000" />
+        <register type="NOA" address="0x00009888" value="0x0E154000" />
+        <register type="NOA" address="0x00009888" value="0x161500E8" />
+        <register type="NOA" address="0x00009888" value="0x02154000" />
+        <register type="NOA" address="0x00009888" value="0x04158000" />
+        <register type="NOA" address="0x00009888" value="0x06154000" />
+        <register type="NOA" address="0x00009888" value="0x08158000" />
+        <register type="NOA" address="0x00009888" value="0x0C154000" />
+        <register type="NOA" address="0x00009888" value="0x08161000" />
+        <register type="NOA" address="0x00009888" value="0x08184000" />
+        <register type="NOA" address="0x00009888" value="0x12190100" />
+        <register type="NOA" address="0x00009888" value="0x0A1A0020" />
+        <register type="NOA" address="0x00009888" value="0x081A0000" />
+        <register type="NOA" address="0x00009888" value="0x0A1C1000" />
+        <register type="NOA" address="0x00009888" value="0x121D0400" />
+        <register type="NOA" address="0x00009884" value="0x00000003" />
+        <register type="NOA" address="0x00009888" value="0x1C1F3000" />
+        <register type="NOA" address="0x00009888" value="0x1A1F0061" />
+        <register type="NOA" address="0x00009888" value="0x181F0000" />
+        <register type="NOA" address="0x00009888" value="0x301F8000" />
+        <register type="NOA" address="0x00009888" value="0x501F4904" />
+        <register type="NOA" address="0x00009888" value="0x521F0024" />
+        <register type="NOA" address="0x00009888" value="0x3A1F8000" />
+        <register type="NOA" address="0x00009888" value="0x4E1F2400" />
+        <register type="NOA" address="0x00009888" value="0x3E1F6000" />
+        <register type="NOA" address="0x00009888" value="0x461F5050" />
+        <register type="NOA" address="0x00009888" value="0x481F1040" />
+        <register type="NOA" address="0x00009888" value="0x401F4010" />
+        <register type="NOA" address="0x00009888" value="0x421F3000" />
+        <register type="NOA" address="0x00009888" value="0x441F5033" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x70800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+        <register type="OA" address="0x00002770" value="0x00000038" />
+        <register type="OA" address="0x00002774" value="0x0000FFF8" />
+        <register type="OA" address="0x00002778" value="0x00000002" />
+        <register type="OA" address="0x0000277C" value="0x0000FFF7" />
+        <register type="OA" address="0x00002780" value="0x00000002" />
+        <register type="OA" address="0x00002784" value="0x0000FFEF" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+    </register_config>
+  </set>
+
+  <set name="Metric set L3_1"
+       mdapi_supported_apis="VK OGL OCL IO BB"
+       underscore_name="l3_1"
+       hw_config_guid="21d69ec3-91e1-48a8-acd6-c0c4ec6e819a"
+       chipset="ICL"
+       symbol_name="L3_1"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 L3 Bank1 Active"
+             description="The percentage of time in which slice0 L3 bank1 is active"
+             data_type="float"
+             max_equation="100"
+             equation="C 1 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l30_bank1_active"
+             units="percent"
+             symbol_name="L30Bank1Active"
+             availability="$SliceMask 1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SQ is full"
+             description="The percentage of time when SQ is filled above a threshold (usually 48 entries)"
+             data_type="float"
+             max_equation="100"
+             equation="B 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gt_request_queue_full"
+             units="percent"
+             symbol_name="GTRequestQueueFull"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Slice0 L3 Bank5 Active"
+             description="The percentage of time in which slice0 L3 bank5 is active"
+             data_type="float"
+             max_equation="100"
+             equation="C 5 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l30_bank5_active"
+             units="percent"
+             symbol_name="L30Bank5Active"
+             availability="$SliceMask 1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 L3 Bank3 Active"
+             description="The percentage of time in which slice0 L3 bank3 is active"
+             data_type="float"
+             max_equation="100"
+             equation="C 3 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l30_bank3_active"
+             units="percent"
+             symbol_name="L30Bank3Active"
+             availability="$SliceMask 1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 L3 Bank6 Active"
+             description="The percentage of time in which slice0 L3 bank6 is active"
+             data_type="float"
+             max_equation="100"
+             equation="C 6 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l30_bank6_active"
+             units="percent"
+             symbol_name="L30Bank6Active"
+             availability="$SliceMask 1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Slice0 L3 Bank2 Active"
+             description="The percentage of time in which slice0 L3 bank2 is active"
+             data_type="float"
+             max_equation="100"
+             equation="C 2 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l30_bank2_active"
+             units="percent"
+             symbol_name="L30Bank2Active"
+             availability="$SliceMask 1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Slice0 L3 Bank0 Active"
+             description="The percentage of time in which slice0 L3 bank0 is active"
+             data_type="float"
+             max_equation="100"
+             equation="C 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l30_bank0_active"
+             units="percent"
+             symbol_name="L30Bank0Active"
+             availability="$SliceMask 1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Slice0 L3 Bank7 Active"
+             description="The percentage of time in which slice0 L3 bank7 is active"
+             data_type="float"
+             max_equation="100"
+             equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l30_bank7_active"
+             units="percent"
+             symbol_name="L30Bank7Active"
+             availability="$SliceMask 1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Slice0 L3 Bank4 Active"
+             description="The percentage of time in which slice0 L3 bank4 is active"
+             data_type="float"
+             max_equation="100"
+             equation="C 4 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l30_bank4_active"
+             units="percent"
+             symbol_name="L30Bank4Active"
+             availability="$SliceMask 1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="$ShaderMemoryAccesses 64 UMUL"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00000D04" value="0x00000200" />
+        <register type="NOA" address="0x00009840" value="0x00000000" />
+        <register type="NOA" address="0x00009884" value="0x00000000" />
+        <register type="NOA" address="0x00009888" value="0x17340000" />
+        <register type="NOA" address="0x00009888" value="0x17740000" />
+        <register type="NOA" address="0x00009888" value="0x17B40000" />
+        <register type="NOA" address="0x00009888" value="0x17F40000" />
+        <register type="NOA" address="0x00009888" value="0x16340000" />
+        <register type="NOA" address="0x00009888" value="0x16740000" />
+        <register type="NOA" address="0x00009888" value="0x16B40000" />
+        <register type="NOA" address="0x00009888" value="0x16F40000" />
+        <register type="NOA" address="0x00009888" value="0x07340037" />
+        <register type="NOA" address="0x00009888" value="0x21340000" />
+        <register type="NOA" address="0x00009888" value="0x09740037" />
+        <register type="NOA" address="0x00009888" value="0x21740000" />
+        <register type="NOA" address="0x00009888" value="0x0BB40037" />
+        <register type="NOA" address="0x00009888" value="0x21B40000" />
+        <register type="NOA" address="0x00009888" value="0x0DF40037" />
+        <register type="NOA" address="0x00009888" value="0x21F40000" />
+        <register type="NOA" address="0x00009888" value="0x0E0000A7" />
+        <register type="NOA" address="0x00009888" value="0x08012000" />
+        <register type="NOA" address="0x00009888" value="0x0A034000" />
+        <register type="NOA" address="0x00009888" value="0x0C038000" />
+        <register type="NOA" address="0x00009888" value="0x1C340037" />
+        <register type="NOA" address="0x00009888" value="0x20340000" />
+        <register type="NOA" address="0x00009888" value="0x1E740037" />
+        <register type="NOA" address="0x00009888" value="0x20740000" />
+        <register type="NOA" address="0x00009888" value="0x02B40037" />
+        <register type="NOA" address="0x00009888" value="0x20B40000" />
+        <register type="NOA" address="0x00009888" value="0x04F40037" />
+        <register type="NOA" address="0x00009888" value="0x20F40000" />
+        <register type="NOA" address="0x00009888" value="0x10040200" />
+        <register type="NOA" address="0x00009888" value="0x0E040055" />
+        <register type="NOA" address="0x00009888" value="0x14050070" />
+        <register type="NOA" address="0x00009888" value="0x04058000" />
+        <register type="NOA" address="0x00009888" value="0x06056000" />
+        <register type="NOA" address="0x00009888" value="0x08055000" />
+        <register type="NOA" address="0x00009888" value="0x0A051000" />
+        <register type="NOA" address="0x00009888" value="0x260600C0" />
+        <register type="NOA" address="0x00009888" value="0x24067E00" />
+        <register type="NOA" address="0x00009888" value="0x02074000" />
+        <register type="NOA" address="0x00009888" value="0x04078000" />
+        <register type="NOA" address="0x00009888" value="0x06124000" />
+        <register type="NOA" address="0x00009888" value="0x08124000" />
+        <register type="NOA" address="0x00009888" value="0x0A124000" />
+        <register type="NOA" address="0x00009888" value="0x0C124000" />
+        <register type="NOA" address="0x00009888" value="0x04138000" />
+        <register type="NOA" address="0x00009888" value="0x06137000" />
+        <register type="NOA" address="0x00009888" value="0x02148000" />
+        <register type="NOA" address="0x00009888" value="0x0414C000" />
+        <register type="NOA" address="0x00009888" value="0x06144000" />
+        <register type="NOA" address="0x00009888" value="0x06154000" />
+        <register type="NOA" address="0x00009888" value="0x08154000" />
+        <register type="NOA" address="0x00009888" value="0x0A154000" />
+        <register type="NOA" address="0x00009888" value="0x0C154000" />
+        <register type="NOA" address="0x00009884" value="0x00000003" />
+        <register type="NOA" address="0x00009888" value="0x1C1F3000" />
+        <register type="NOA" address="0x00009888" value="0x2A1F0061" />
+        <register type="NOA" address="0x00009888" value="0x181F0000" />
+        <register type="NOA" address="0x00009888" value="0x521F0000" />
+        <register type="NOA" address="0x00009888" value="0x541F0024" />
+        <register type="NOA" address="0x00009888" value="0x3A1F8000" />
+        <register type="NOA" address="0x00009888" value="0x4E1F2460" />
+        <register type="NOA" address="0x00009888" value="0x501F0124" />
+        <register type="NOA" address="0x00009888" value="0x4C1F0133" />
+        <register type="NOA" address="0x00009888" value="0x301F0000" />
+        <register type="NOA" address="0x00009888" value="0x401F6060" />
+        <register type="NOA" address="0x00009888" value="0x421F0010" />
+        <register type="NOA" address="0x00009888" value="0x441F0000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x00800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+    </register_config>
+  </set>
+
+  <set name="Gen11 L2Bank0 stalled metric set"
+       mdapi_supported_apis="VK OGL OGL4 OCL MEDIA IO BB"
+       underscore_name="l3_2"
+       hw_config_guid="e60e9155-6830-4aec-baf2-1c3c15a73869"
+       chipset="ICL"
+       symbol_name="L3_2"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 13 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on the both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 14 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 L3 Bank0 Stalled"
+             description="The percentage of time in which slice0 L3 bank0 is stalled"
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ B 1 READ FADD B 2 READ FADD B 3 READ FADD 4 FDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l30_bank0_stalled"
+             units="percent"
+             symbol_name="L30Bank0Stalled"
+             availability="$SliceMask 1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="EU Thread Occupancy"
+             description="The percentage of time in which hardware threads occupied EUs."
+             data_type="float"
+             max_equation="100"
+             equation="8 A 10 READ FMUL $EuThreadsCount FDIV $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_thread_occupancy"
+             units="percent"
+             symbol_name="EuThreadOccupancy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00000D04" value="0x00000200" />
+        <register type="NOA" address="0x00009840" value="0x00000000" />
+        <register type="NOA" address="0x00009884" value="0x00000000" />
+        <register type="NOA" address="0x00009888" value="0x10050C00" />
+        <register type="NOA" address="0x00009888" value="0x12050002" />
+        <register type="NOA" address="0x00009888" value="0x00050025" />
+        <register type="NOA" address="0x00009888" value="0x06050900" />
+        <register type="NOA" address="0x00009888" value="0x080508EA" />
+        <register type="NOA" address="0x00009888" value="0x0A0508AB" />
+        <register type="NOA" address="0x00009888" value="0x0C050A21" />
+        <register type="NOA" address="0x00009888" value="0x0E050A60" />
+        <register type="NOA" address="0x00009888" value="0x04050000" />
+        <register type="NOA" address="0x00009888" value="0x14050000" />
+        <register type="NOA" address="0x00009888" value="0x24068100" />
+        <register type="NOA" address="0x00009888" value="0x260600FF" />
+        <register type="NOA" address="0x00009884" value="0x00000003" />
+        <register type="NOA" address="0x00009888" value="0x301F8000" />
+        <register type="NOA" address="0x00009888" value="0x501F4800" />
+        <register type="NOA" address="0x00009888" value="0x521F4924" />
+        <register type="NOA" address="0x00009888" value="0x541F0024" />
+        <register type="NOA" address="0x00009888" value="0x3E1F0000" />
+        <register type="NOA" address="0x00009888" value="0x461F0000" />
+        <register type="NOA" address="0x00009888" value="0x481F0000" />
+        <register type="NOA" address="0x00009888" value="0x4A1F0000" />
+        <register type="NOA" address="0x00009888" value="0x4C1F0000" />
+        <register type="NOA" address="0x00009888" value="0x181F0000" />
+        <register type="NOA" address="0x00009888" value="0x4E1F0000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+        <register type="OA" address="0x00002770" value="0x00000022" />
+        <register type="OA" address="0x00002774" value="0x0000FFF8" />
+        <register type="OA" address="0x00002778" value="0x00000082" />
+        <register type="OA" address="0x0000277C" value="0x0000FFE7" />
+        <register type="OA" address="0x00002780" value="0x00000402" />
+        <register type="OA" address="0x00002784" value="0x0000FF1F" />
+        <register type="OA" address="0x00002788" value="0x00001002" />
+        <register type="OA" address="0x0000278C" value="0x0000FCFF" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00008003" />
+        <register type="FLEX" address="0x0000E658" value="0x00011010" />
+        <register type="FLEX" address="0x0000E758" value="0x00050012" />
+        <register type="FLEX" address="0x0000E45C" value="0x00052051" />
+        <register type="FLEX" address="0x0000E55C" value="0x00000053" />
+    </register_config>
+  </set>
+
+  <set name="Gen11 L2Bank1 stalled metric set"
+       mdapi_supported_apis="VK OGL OGL4 OCL MEDIA IO BB"
+       underscore_name="l3_3"
+       hw_config_guid="47c364d5-1799-4d17-9447-add9358c6451"
+       chipset="ICL"
+       symbol_name="L3_3"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 13 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on the both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="Slice0 L3 Bank1 Stalled"
+             description="The percentage of time in which slice0 L3 bank1 is stalled"
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ B 1 READ FADD B 2 READ FADD B 3 READ FADD 4 FDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l30_bank1_stalled"
+             units="percent"
+             symbol_name="L30Bank1Stalled"
+             availability="$SliceMask 1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 14 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="EU Thread Occupancy"
+             description="The percentage of time in which hardware threads occupied EUs."
+             data_type="float"
+             max_equation="100"
+             equation="8 A 10 READ FMUL $EuThreadsCount FDIV $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_thread_occupancy"
+             units="percent"
+             symbol_name="EuThreadOccupancy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00000D04" value="0x00000200" />
+        <register type="NOA" address="0x00009840" value="0x00000000" />
+        <register type="NOA" address="0x00009884" value="0x00000000" />
+        <register type="NOA" address="0x00009888" value="0x10050400" />
+        <register type="NOA" address="0x00009888" value="0x12050000" />
+        <register type="NOA" address="0x00009888" value="0x00050025" />
+        <register type="NOA" address="0x00009888" value="0x06050900" />
+        <register type="NOA" address="0x00009888" value="0x080508EA" />
+        <register type="NOA" address="0x00009888" value="0x0A0508AB" />
+        <register type="NOA" address="0x00009888" value="0x0C050A21" />
+        <register type="NOA" address="0x00009888" value="0x0E050A60" />
+        <register type="NOA" address="0x00009888" value="0x04050000" />
+        <register type="NOA" address="0x00009888" value="0x14050000" />
+        <register type="NOA" address="0x00009888" value="0x24068100" />
+        <register type="NOA" address="0x00009888" value="0x260600FF" />
+        <register type="NOA" address="0x00009884" value="0x00000003" />
+        <register type="NOA" address="0x00009888" value="0x301F8000" />
+        <register type="NOA" address="0x00009888" value="0x501F4800" />
+        <register type="NOA" address="0x00009888" value="0x521F4924" />
+        <register type="NOA" address="0x00009888" value="0x541F0024" />
+        <register type="NOA" address="0x00009888" value="0x3E1F0000" />
+        <register type="NOA" address="0x00009888" value="0x461F0000" />
+        <register type="NOA" address="0x00009888" value="0x481F0000" />
+        <register type="NOA" address="0x00009888" value="0x4A1F0000" />
+        <register type="NOA" address="0x00009888" value="0x4C1F0000" />
+        <register type="NOA" address="0x00009888" value="0x181F0000" />
+        <register type="NOA" address="0x00009888" value="0x4E1F0000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+        <register type="OA" address="0x00002770" value="0x00000022" />
+        <register type="OA" address="0x00002774" value="0x0000FFF8" />
+        <register type="OA" address="0x00002778" value="0x00000082" />
+        <register type="OA" address="0x0000277C" value="0x0000FFE7" />
+        <register type="OA" address="0x00002780" value="0x00000402" />
+        <register type="OA" address="0x00002784" value="0x0000FF1F" />
+        <register type="OA" address="0x00002788" value="0x00001002" />
+        <register type="OA" address="0x0000278C" value="0x0000FCFF" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00008003" />
+        <register type="FLEX" address="0x0000E658" value="0x00011010" />
+        <register type="FLEX" address="0x0000E758" value="0x00050012" />
+        <register type="FLEX" address="0x0000E45C" value="0x00052051" />
+        <register type="FLEX" address="0x0000E55C" value="0x00000053" />
+    </register_config>
+  </set>
+
+  <set name="Gen11 L2Bank4 stalled metric set"
+       mdapi_supported_apis="VK OGL OGL4 OCL MEDIA IO BB"
+       underscore_name="l3_4"
+       hw_config_guid="e5ab5c08-3130-4469-8eaf-b23d3dc817d4"
+       chipset="ICL"
+       symbol_name="L3_4"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 13 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were actively processed on both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 14 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Slice0 L3 Bank4 Stalled"
+             description="The percentage of time in which slice0 L3 bank4 is stalled."
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ B 1 READ FADD B 2 READ FADD B 3 READ FADD 4 FDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l30_bank4_stalled"
+             units="percent"
+             symbol_name="L30Bank4Stalled"
+             availability="$SliceMask 1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="EU Thread Occupancy"
+             description="The percentage of time in which hardware threads occupied EUs."
+             data_type="float"
+             max_equation="100"
+             equation="8 A 10 READ FMUL $EuThreadsCount FDIV $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_thread_occupancy"
+             units="percent"
+             symbol_name="EuThreadOccupancy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00000D04" value="0x00000200" />
+        <register type="NOA" address="0x00009840" value="0x00000000" />
+        <register type="NOA" address="0x00009884" value="0x00000000" />
+        <register type="NOA" address="0x00009888" value="0x10010C00" />
+        <register type="NOA" address="0x00009888" value="0x12010002" />
+        <register type="NOA" address="0x00009888" value="0x0C000400" />
+        <register type="NOA" address="0x00009888" value="0x0E005500" />
+        <register type="NOA" address="0x00009888" value="0x10000155" />
+        <register type="NOA" address="0x00009888" value="0x00010025" />
+        <register type="NOA" address="0x00009888" value="0x06010900" />
+        <register type="NOA" address="0x00009888" value="0x080108EA" />
+        <register type="NOA" address="0x00009888" value="0x0A0108AB" />
+        <register type="NOA" address="0x00009888" value="0x0C010A21" />
+        <register type="NOA" address="0x00009888" value="0x0E010A60" />
+        <register type="NOA" address="0x00009888" value="0x04010000" />
+        <register type="NOA" address="0x00009888" value="0x14010000" />
+        <register type="NOA" address="0x00009888" value="0x0C040400" />
+        <register type="NOA" address="0x00009888" value="0x0E045500" />
+        <register type="NOA" address="0x00009888" value="0x10040155" />
+        <register type="NOA" address="0x00009888" value="0x04051000" />
+        <register type="NOA" address="0x00009888" value="0x0A054000" />
+        <register type="NOA" address="0x00009888" value="0x0C055000" />
+        <register type="NOA" address="0x00009888" value="0x0E055000" />
+        <register type="NOA" address="0x00009888" value="0x14050055" />
+        <register type="NOA" address="0x00009888" value="0x24068100" />
+        <register type="NOA" address="0x00009888" value="0x260600FF" />
+        <register type="NOA" address="0x00009888" value="0x00124000" />
+        <register type="NOA" address="0x00009888" value="0x0E124000" />
+        <register type="NOA" address="0x00009888" value="0x18125540" />
+        <register type="NOA" address="0x00009888" value="0x1A120015" />
+        <register type="NOA" address="0x00009888" value="0x04131000" />
+        <register type="NOA" address="0x00009888" value="0x06138000" />
+        <register type="NOA" address="0x00009888" value="0x0813F000" />
+        <register type="NOA" address="0x00009888" value="0x0A13F000" />
+        <register type="NOA" address="0x00009888" value="0x00144000" />
+        <register type="NOA" address="0x00009888" value="0x06148000" />
+        <register type="NOA" address="0x00009888" value="0x0814C000" />
+        <register type="NOA" address="0x00009888" value="0x0A14C000" />
+        <register type="NOA" address="0x00009888" value="0x0C14C000" />
+        <register type="NOA" address="0x00009888" value="0x0E14C000" />
+        <register type="NOA" address="0x00009888" value="0x00154000" />
+        <register type="NOA" address="0x00009888" value="0x0E154000" />
+        <register type="NOA" address="0x00009888" value="0x16152AA8" />
+        <register type="NOA" address="0x00009888" value="0x18150005" />
+        <register type="NOA" address="0x00009884" value="0x00000003" />
+        <register type="NOA" address="0x00009888" value="0x301F8000" />
+        <register type="NOA" address="0x00009888" value="0x501F4800" />
+        <register type="NOA" address="0x00009888" value="0x521F4924" />
+        <register type="NOA" address="0x00009888" value="0x541F0024" />
+        <register type="NOA" address="0x00009888" value="0x3E1F0000" />
+        <register type="NOA" address="0x00009888" value="0x461F0000" />
+        <register type="NOA" address="0x00009888" value="0x481F0000" />
+        <register type="NOA" address="0x00009888" value="0x4A1F0000" />
+        <register type="NOA" address="0x00009888" value="0x4C1F0000" />
+        <register type="NOA" address="0x00009888" value="0x181F0000" />
+        <register type="NOA" address="0x00009888" value="0x4E1F0000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+        <register type="OA" address="0x00002770" value="0x00000022" />
+        <register type="OA" address="0x00002774" value="0x0000FFF8" />
+        <register type="OA" address="0x00002778" value="0x00000082" />
+        <register type="OA" address="0x0000277C" value="0x0000FFE7" />
+        <register type="OA" address="0x00002780" value="0x00000402" />
+        <register type="OA" address="0x00002784" value="0x0000FF1F" />
+        <register type="OA" address="0x00002788" value="0x00001002" />
+        <register type="OA" address="0x0000278C" value="0x0000FCFF" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00008003" />
+        <register type="FLEX" address="0x0000E658" value="0x00011010" />
+        <register type="FLEX" address="0x0000E758" value="0x00050012" />
+        <register type="FLEX" address="0x0000E45C" value="0x00052051" />
+        <register type="FLEX" address="0x0000E55C" value="0x00000053" />
+    </register_config>
+  </set>
+
+  <set name="Gen11 L2Bank5 stalled metric set"
+       mdapi_supported_apis="VK OGL OGL4 OCL MEDIA IO BB"
+       underscore_name="l3_5"
+       hw_config_guid="6cdf23c1-f725-414c-959a-c90fa5571b1f"
+       chipset="ICL"
+       symbol_name="L3_5"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 13 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 14 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="Slice0 L3 Bank5 Stalled"
+             description="The percentage of time in which slice0 L3 bank5 is stalled"
+             data_type="float"
+             max_equation="100"
+             equation="B 2 READ B 3 READ FADD B 0 READ FADD B 1 READ FADD 4 FDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l30_bank5_stalled"
+             units="percent"
+             symbol_name="L30Bank5Stalled"
+             availability="$SliceMask 1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="EU Thread Occupancy"
+             description="The percentage of time in which hardware threads occupied EUs."
+             data_type="float"
+             max_equation="100"
+             equation="8 A 10 READ FMUL $EuThreadsCount FDIV $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_thread_occupancy"
+             units="percent"
+             symbol_name="EuThreadOccupancy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00000D04" value="0x00000200" />
+        <register type="NOA" address="0x00009840" value="0x00000000" />
+        <register type="NOA" address="0x00009884" value="0x00000000" />
+        <register type="NOA" address="0x00009888" value="0x10010400" />
+        <register type="NOA" address="0x00009888" value="0x12010000" />
+        <register type="NOA" address="0x00009888" value="0x0C000400" />
+        <register type="NOA" address="0x00009888" value="0x0E005500" />
+        <register type="NOA" address="0x00009888" value="0x10000155" />
+        <register type="NOA" address="0x00009888" value="0x00010022" />
+        <register type="NOA" address="0x00009888" value="0x06010840" />
+        <register type="NOA" address="0x00009888" value="0x08010828" />
+        <register type="NOA" address="0x00009888" value="0x0A010969" />
+        <register type="NOA" address="0x00009888" value="0x0C010AA4" />
+        <register type="NOA" address="0x00009888" value="0x0E010AE3" />
+        <register type="NOA" address="0x00009888" value="0x04010000" />
+        <register type="NOA" address="0x00009888" value="0x14010000" />
+        <register type="NOA" address="0x00009888" value="0x0C040400" />
+        <register type="NOA" address="0x00009888" value="0x0E045500" />
+        <register type="NOA" address="0x00009888" value="0x10040155" />
+        <register type="NOA" address="0x00009888" value="0x04051000" />
+        <register type="NOA" address="0x00009888" value="0x0A054000" />
+        <register type="NOA" address="0x00009888" value="0x0C055000" />
+        <register type="NOA" address="0x00009888" value="0x0E055000" />
+        <register type="NOA" address="0x00009888" value="0x14050055" />
+        <register type="NOA" address="0x00009888" value="0x24068100" />
+        <register type="NOA" address="0x00009888" value="0x260600FF" />
+        <register type="NOA" address="0x00009888" value="0x00124000" />
+        <register type="NOA" address="0x00009888" value="0x0E124000" />
+        <register type="NOA" address="0x00009888" value="0x18125540" />
+        <register type="NOA" address="0x00009888" value="0x1A120015" />
+        <register type="NOA" address="0x00009888" value="0x04131000" />
+        <register type="NOA" address="0x00009888" value="0x06138000" />
+        <register type="NOA" address="0x00009888" value="0x0813F000" />
+        <register type="NOA" address="0x00009888" value="0x0A13F000" />
+        <register type="NOA" address="0x00009888" value="0x00144000" />
+        <register type="NOA" address="0x00009888" value="0x06148000" />
+        <register type="NOA" address="0x00009888" value="0x0814C000" />
+        <register type="NOA" address="0x00009888" value="0x0A14C000" />
+        <register type="NOA" address="0x00009888" value="0x0C14C000" />
+        <register type="NOA" address="0x00009888" value="0x0E14C000" />
+        <register type="NOA" address="0x00009888" value="0x00154000" />
+        <register type="NOA" address="0x00009888" value="0x0E154000" />
+        <register type="NOA" address="0x00009888" value="0x16152AA8" />
+        <register type="NOA" address="0x00009888" value="0x18150005" />
+        <register type="NOA" address="0x00009884" value="0x00000003" />
+        <register type="NOA" address="0x00009888" value="0x301F8000" />
+        <register type="NOA" address="0x00009888" value="0x501F4800" />
+        <register type="NOA" address="0x00009888" value="0x521F4924" />
+        <register type="NOA" address="0x00009888" value="0x541F0024" />
+        <register type="NOA" address="0x00009888" value="0x3E1F0000" />
+        <register type="NOA" address="0x00009888" value="0x461F0000" />
+        <register type="NOA" address="0x00009888" value="0x481F0000" />
+        <register type="NOA" address="0x00009888" value="0x4A1F0000" />
+        <register type="NOA" address="0x00009888" value="0x4C1F0000" />
+        <register type="NOA" address="0x00009888" value="0x181F0000" />
+        <register type="NOA" address="0x00009888" value="0x4E1F0000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+        <register type="OA" address="0x00002770" value="0x00000022" />
+        <register type="OA" address="0x00002774" value="0x0000FFF8" />
+        <register type="OA" address="0x00002778" value="0x00000082" />
+        <register type="OA" address="0x0000277C" value="0x0000FFE7" />
+        <register type="OA" address="0x00002780" value="0x00000402" />
+        <register type="OA" address="0x00002784" value="0x0000FF1F" />
+        <register type="OA" address="0x00002788" value="0x00001002" />
+        <register type="OA" address="0x0000278C" value="0x0000FCFF" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00008003" />
+        <register type="FLEX" address="0x0000E658" value="0x00011010" />
+        <register type="FLEX" address="0x0000E758" value="0x00050012" />
+        <register type="FLEX" address="0x0000E45C" value="0x00052051" />
+        <register type="FLEX" address="0x0000E55C" value="0x00000053" />
+    </register_config>
+  </set>
+
+  <set name="Metric set Sampler 1"
+       mdapi_supported_apis="VK OGL OCL IO BB"
+       underscore_name="sampler_1"
+       hw_config_guid="51a2eb6d-9fad-4489-8f22-ab845fe7882a"
+       chipset="ICL"
+       symbol_name="Sampler_1"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 Subslice2 Input Available"
+             description="The percentage of time in which slice0 subslice2 sampler input is available"
+             data_type="float"
+             max_equation="100"
+             equation="B 5 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler02_input_available"
+             units="percent"
+             symbol_name="Sampler02InputAvailable"
+             availability="$SubsliceMask 4 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 Subslice0 Input Available"
+             description="The percentage of time in which slice0 subslice0 sampler input is available"
+             data_type="float"
+             max_equation="100"
+             equation="B 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler00_input_available"
+             units="percent"
+             symbol_name="Sampler00InputAvailable"
+             availability="$SubsliceMask 1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Slice0 Subslice1 Input Available"
+             description="The percentage of time in which slice0 subslice1 sampler input is available"
+             data_type="float"
+             max_equation="100"
+             equation="B 6 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler01_input_available"
+             units="percent"
+             symbol_name="Sampler01InputAvailable"
+             availability="$SubsliceMask 2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Slice0 Subslice6 Input Available"
+             description="The percentage of time in which slice0 subslice6 sampler input is available"
+             data_type="float"
+             max_equation="100"
+             equation="B 1 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler06_input_available"
+             units="percent"
+             symbol_name="Sampler06InputAvailable"
+             availability="$SubsliceMask 64 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texel lookups (with 2x2 accuracy) that missed the L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 Subslice4 Input Available"
+             description="The percentage of time in which slice0 subslice4 sampler input is available."
+             data_type="float"
+             max_equation="100"
+             equation="B 3 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler04_input_available"
+             units="percent"
+             symbol_name="Sampler04InputAvailable"
+             availability="$SubsliceMask 16 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="Slice0 Subslice3 Input Available"
+             description="The percentage of time in which slice0 subslice3 sampler input is available."
+             data_type="float"
+             max_equation="100"
+             equation="B 4 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler03_input_available"
+             units="percent"
+             symbol_name="Sampler03InputAvailable"
+             availability="$SubsliceMask 8 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 Subslice5 Input Available"
+             description="The percentage of time in which slice0 subslice5 sampler input is available."
+             data_type="float"
+             max_equation="100"
+             equation="B 2 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler05_input_available"
+             units="percent"
+             symbol_name="Sampler05InputAvailable"
+             availability="$SubsliceMask 32 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Slice0 Subslice7 Input Available"
+             description="The percentage of time in which slice0 subslice7 sampler input is available."
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler07_input_available"
+             units="percent"
+             symbol_name="Sampler07InputAvailable"
+             availability="$SubsliceMask 128 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches without URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="$ShaderMemoryAccesses 64 UMUL"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00000D04" value="0x00000200" />
+        <register type="NOA" address="0x00009840" value="0x00000000" />
+        <register type="NOA" address="0x00009884" value="0x00000000" />
+        <register type="NOA" address="0x00009888" value="0x142A0165" />
+        <register type="NOA" address="0x00009888" value="0x142F0165" />
+        <register type="NOA" address="0x00009888" value="0x146A0165" />
+        <register type="NOA" address="0x00009888" value="0x146F0165" />
+        <register type="NOA" address="0x00009888" value="0x14AA0165" />
+        <register type="NOA" address="0x00009888" value="0x14AF0165" />
+        <register type="NOA" address="0x00009888" value="0x14EA0165" />
+        <register type="NOA" address="0x00009888" value="0x14EF0165" />
+        <register type="NOA" address="0x00009888" value="0x161E8000" />
+        <register type="NOA" address="0x00009888" value="0x181EC000" />
+        <register type="NOA" address="0x00009888" value="0x1A1E0400" />
+        <register type="NOA" address="0x00009888" value="0x061F8000" />
+        <register type="NOA" address="0x00009888" value="0x081F8000" />
+        <register type="NOA" address="0x00009888" value="0x0A1F8000" />
+        <register type="NOA" address="0x00009888" value="0x0C1F0400" />
+        <register type="NOA" address="0x00009888" value="0x06204000" />
+        <register type="NOA" address="0x00009888" value="0x08204000" />
+        <register type="NOA" address="0x00009888" value="0x0A204000" />
+        <register type="NOA" address="0x00009888" value="0x0C204000" />
+        <register type="NOA" address="0x00009888" value="0x06218000" />
+        <register type="NOA" address="0x00009888" value="0x08218000" />
+        <register type="NOA" address="0x00009888" value="0x0A218000" />
+        <register type="NOA" address="0x00009888" value="0x0C218000" />
+        <register type="NOA" address="0x00009888" value="0x042A1800" />
+        <register type="NOA" address="0x00009888" value="0x062AC038" />
+        <register type="NOA" address="0x00009888" value="0x102A0000" />
+        <register type="NOA" address="0x00009888" value="0x082AC000" />
+        <register type="NOA" address="0x00009888" value="0x0A2A0000" />
+        <register type="NOA" address="0x00009888" value="0x0C2A0000" />
+        <register type="NOA" address="0x00009888" value="0x0A2C8000" />
+        <register type="NOA" address="0x00009888" value="0x0C2C8000" />
+        <register type="NOA" address="0x00009888" value="0x0E2C8000" />
+        <register type="NOA" address="0x00009888" value="0x182C0002" />
+        <register type="NOA" address="0x00009888" value="0x022F2000" />
+        <register type="NOA" address="0x00009888" value="0x042F0048" />
+        <register type="NOA" address="0x00009888" value="0x102F0000" />
+        <register type="NOA" address="0x00009888" value="0x1C5E000C" />
+        <register type="NOA" address="0x00009888" value="0x125E8000" />
+        <register type="NOA" address="0x00009888" value="0x145E8000" />
+        <register type="NOA" address="0x00009888" value="0x0E5F000C" />
+        <register type="NOA" address="0x00009888" value="0x025F8000" />
+        <register type="NOA" address="0x00009888" value="0x045F8000" />
+        <register type="NOA" address="0x00009888" value="0x1C600014" />
+        <register type="NOA" address="0x00009888" value="0x02604000" />
+        <register type="NOA" address="0x00009888" value="0x04604000" />
+        <register type="NOA" address="0x00009888" value="0x16612800" />
+        <register type="NOA" address="0x00009888" value="0x02618000" />
+        <register type="NOA" address="0x00009888" value="0x04618000" />
+        <register type="NOA" address="0x00009888" value="0x006A1800" />
+        <register type="NOA" address="0x00009888" value="0x026A0038" />
+        <register type="NOA" address="0x00009888" value="0x106A0000" />
+        <register type="NOA" address="0x00009888" value="0x1A6A00F0" />
+        <register type="NOA" address="0x00009888" value="0x046A0000" />
+        <register type="NOA" address="0x00009888" value="0x1A6C000A" />
+        <register type="NOA" address="0x00009888" value="0x066C8000" />
+        <register type="NOA" address="0x00009888" value="0x086C8000" />
+        <register type="NOA" address="0x00009888" value="0x0E6F2440" />
+        <register type="NOA" address="0x00009888" value="0x106F0000" />
+        <register type="NOA" address="0x00009888" value="0x1A9EC000" />
+        <register type="NOA" address="0x00009888" value="0x1C9E0003" />
+        <register type="NOA" address="0x00009888" value="0x0C9FC000" />
+        <register type="NOA" address="0x00009888" value="0x0E9F0003" />
+        <register type="NOA" address="0x00009888" value="0x1AA02A00" />
+        <register type="NOA" address="0x00009888" value="0x1CA00001" />
+        <register type="NOA" address="0x00009888" value="0x16A102A8" />
+        <register type="NOA" address="0x00009888" value="0x0CAA1C30" />
+        <register type="NOA" address="0x00009888" value="0x10AA0000" />
+        <register type="NOA" address="0x00009888" value="0x18AAF000" />
+        <register type="NOA" address="0x00009888" value="0x1AAA0000" />
+        <register type="NOA" address="0x00009888" value="0x18ACAA00" />
+        <register type="NOA" address="0x00009888" value="0x0AAF2440" />
+        <register type="NOA" address="0x00009888" value="0x10AF0000" />
+        <register type="NOA" address="0x00009888" value="0x10DE8000" />
+        <register type="NOA" address="0x00009888" value="0x1ADE3800" />
+        <register type="NOA" address="0x00009888" value="0x00DF8000" />
+        <register type="NOA" address="0x00009888" value="0x0CDF3800" />
+        <register type="NOA" address="0x00009888" value="0x00E04000" />
+        <register type="NOA" address="0x00009888" value="0x0EE04000" />
+        <register type="NOA" address="0x00009888" value="0x1AE000A0" />
+        <register type="NOA" address="0x00009888" value="0x00E18000" />
+        <register type="NOA" address="0x00009888" value="0x0EE18000" />
+        <register type="NOA" address="0x00009888" value="0x14E18000" />
+        <register type="NOA" address="0x00009888" value="0x16E10002" />
+        <register type="NOA" address="0x00009888" value="0x08EA1C30" />
+        <register type="NOA" address="0x00009888" value="0x10EA0000" />
+        <register type="NOA" address="0x00009888" value="0x00EAC000" />
+        <register type="NOA" address="0x00009888" value="0x0EEAC000" />
+        <register type="NOA" address="0x00009888" value="0x18EA0000" />
+        <register type="NOA" address="0x00009888" value="0x04EC8000" />
+        <register type="NOA" address="0x00009888" value="0x18EC00A8" />
+        <register type="NOA" address="0x00009888" value="0x00EF0040" />
+        <register type="NOA" address="0x00009888" value="0x06EF2400" />
+        <register type="NOA" address="0x00009888" value="0x10EF0000" />
+        <register type="NOA" address="0x00009888" value="0x0C045400" />
+        <register type="NOA" address="0x00009888" value="0x0E045555" />
+        <register type="NOA" address="0x00009888" value="0x10040155" />
+        <register type="NOA" address="0x00009888" value="0x04055000" />
+        <register type="NOA" address="0x00009888" value="0x0A055000" />
+        <register type="NOA" address="0x00009888" value="0x0C055000" />
+        <register type="NOA" address="0x00009888" value="0x0E055000" />
+        <register type="NOA" address="0x00009888" value="0x14050055" />
+        <register type="NOA" address="0x00009888" value="0x06055000" />
+        <register type="NOA" address="0x00009888" value="0x08055000" />
+        <register type="NOA" address="0x00009888" value="0x2406FF00" />
+        <register type="NOA" address="0x00009888" value="0x260600FF" />
+        <register type="NOA" address="0x00009888" value="0x0E08A000" />
+        <register type="NOA" address="0x00009888" value="0x00088000" />
+        <register type="NOA" address="0x00009888" value="0x02082000" />
+        <register type="NOA" address="0x00009888" value="0x14090050" />
+        <register type="NOA" address="0x00009888" value="0x04094000" />
+        <register type="NOA" address="0x00009888" value="0x06091000" />
+        <register type="NOA" address="0x00009888" value="0x000D2000" />
+        <register type="NOA" address="0x00009888" value="0x060D8000" />
+        <register type="NOA" address="0x00009888" value="0x080DA000" />
+        <register type="NOA" address="0x00009888" value="0x040E1000" />
+        <register type="NOA" address="0x00009888" value="0x0A0E4000" />
+        <register type="NOA" address="0x00009888" value="0x0C0E5000" />
+        <register type="NOA" address="0x00009888" value="0x1812FC00" />
+        <register type="NOA" address="0x00009888" value="0x1A12002B" />
+        <register type="NOA" address="0x00009888" value="0x02128000" />
+        <register type="NOA" address="0x00009888" value="0x04128000" />
+        <register type="NOA" address="0x00009888" value="0x0813C000" />
+        <register type="NOA" address="0x00009888" value="0x0A13F000" />
+        <register type="NOA" address="0x00009888" value="0x04136000" />
+        <register type="NOA" address="0x00009888" value="0x0A14C000" />
+        <register type="NOA" address="0x00009888" value="0x0C14C000" />
+        <register type="NOA" address="0x00009888" value="0x0E14C000" />
+        <register type="NOA" address="0x00009888" value="0x00148000" />
+        <register type="NOA" address="0x00009888" value="0x02144000" />
+        <register type="NOA" address="0x00009888" value="0x00158000" />
+        <register type="NOA" address="0x00009888" value="0x0E158000" />
+        <register type="NOA" address="0x00009888" value="0x16152AD0" />
+        <register type="NOA" address="0x00009888" value="0x18150005" />
+        <register type="NOA" address="0x00009888" value="0x02154000" />
+        <register type="NOA" address="0x00009888" value="0x04154000" />
+        <register type="NOA" address="0x00009888" value="0x0615C000" />
+        <register type="NOA" address="0x00009888" value="0x0815C000" />
+        <register type="NOA" address="0x00009888" value="0x0A15C000" />
+        <register type="NOA" address="0x00009888" value="0x0C15C000" />
+        <register type="NOA" address="0x00009888" value="0x02188000" />
+        <register type="NOA" address="0x00009888" value="0x0418A000" />
+        <register type="NOA" address="0x00009888" value="0x06182000" />
+        <register type="NOA" address="0x00009888" value="0x0A198000" />
+        <register type="NOA" address="0x00009888" value="0x0C19A000" />
+        <register type="NOA" address="0x00009888" value="0x0E192000" />
+        <register type="NOA" address="0x00009888" value="0x0A1CA000" />
+        <register type="NOA" address="0x00009888" value="0x0C1CA000" />
+        <register type="NOA" address="0x00009888" value="0x121D5400" />
+        <register type="NOA" address="0x00009888" value="0x141D0002" />
+        <register type="NOA" address="0x00009884" value="0x00000003" />
+        <register type="NOA" address="0x00009888" value="0x301F8000" />
+        <register type="NOA" address="0x00009888" value="0x501F4924" />
+        <register type="NOA" address="0x00009888" value="0x521F4924" />
+        <register type="NOA" address="0x00009888" value="0x541F0024" />
+        <register type="NOA" address="0x00009888" value="0x3A1F8000" />
+        <register type="NOA" address="0x00009888" value="0x4E1F2400" />
+        <register type="NOA" address="0x00009888" value="0x3E1F3000" />
+        <register type="NOA" address="0x00009888" value="0x461F4030" />
+        <register type="NOA" address="0x00009888" value="0x481F0040" />
+        <register type="NOA" address="0x00009888" value="0x4A1F1000" />
+        <register type="NOA" address="0x00009888" value="0x4C1F0010" />
+        <register type="NOA" address="0x00009888" value="0x181F0000" />
+        <register type="NOA" address="0x00009888" value="0x401F1010" />
+        <register type="NOA" address="0x00009888" value="0x421F3030" />
+        <register type="NOA" address="0x00009888" value="0x441F4040" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0xF0800000" />
+        <register type="OA" address="0x00002770" value="0x00000018" />
+        <register type="OA" address="0x00002774" value="0x0000FFFC" />
+        <register type="OA" address="0x00002778" value="0x00000060" />
+        <register type="OA" address="0x0000277C" value="0x0000FFF3" />
+        <register type="OA" address="0x00002780" value="0x00000180" />
+        <register type="OA" address="0x00002784" value="0x0000FFCF" />
+        <register type="OA" address="0x00002788" value="0x00000600" />
+        <register type="OA" address="0x0000278C" value="0x0000FF3F" />
+        <register type="OA" address="0x00002790" value="0x00001800" />
+        <register type="OA" address="0x00002794" value="0x0000FCFF" />
+        <register type="OA" address="0x00002798" value="0x00006000" />
+        <register type="OA" address="0x0000279C" value="0x0000F3FF" />
+        <register type="OA" address="0x000027A0" value="0x00018000" />
+        <register type="OA" address="0x000027A4" value="0x0000CFFF" />
+        <register type="OA" address="0x000027A8" value="0x00060000" />
+        <register type="OA" address="0x000027AC" value="0x00003FFF" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+    </register_config>
+  </set>
+
+  <set name="Metric set Sampler 2"
+       mdapi_supported_apis="VK OGL OCL IO BB"
+       underscore_name="sampler_2"
+       hw_config_guid="afc0f021-8c33-4d60-803d-93487f96c7c1"
+       chipset="ICL"
+       symbol_name="Sampler_2"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SQ is full"
+             description="The percentage of time when SQ is filled above a threshold (usually 48 entries)"
+             data_type="float"
+             max_equation="100"
+             equation="B 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gt_request_queue_full"
+             units="percent"
+             symbol_name="GTRequestQueueFull"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on the both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="Slice0 Subslice2 Sampler Output Ready"
+             description="The percentage of time in which slice0 subslice2 sampler output is ready"
+             data_type="float"
+             max_equation="100"
+             equation="C 2 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler02_output_ready"
+             units="percent"
+             symbol_name="Sampler02OutputReady"
+             availability="$SubsliceMask 4 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Slice0 Subslice6 Sampler Output Ready"
+             description="The percentage of time in which slice0 subslice6 sampler output is ready"
+             data_type="float"
+             max_equation="100"
+             equation="C 6 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler06_output_ready"
+             units="percent"
+             symbol_name="Sampler06OutputReady"
+             availability="$SubsliceMask 64 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Slice0 Subslice4 Sampler Output Ready"
+             description="The percentage of time in which slice0 subslice4 sampler output is ready"
+             data_type="float"
+             max_equation="100"
+             equation="C 4 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler04_output_ready"
+             units="percent"
+             symbol_name="Sampler04OutputReady"
+             availability="$SubsliceMask 16 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Slice0 Subslice3 Sampler Output Ready"
+             description="The percentage of time in which slice0 subslice3 sampler output is ready"
+             data_type="float"
+             max_equation="100"
+             equation="C 3 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler03_output_ready"
+             units="percent"
+             symbol_name="Sampler03OutputReady"
+             availability="$SubsliceMask 8 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 Subslice7 Sampler Output Ready"
+             description="The percentage of time in which slice0 subslice7 sampler output is ready"
+             data_type="float"
+             max_equation="100"
+             equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler07_output_ready"
+             units="percent"
+             symbol_name="Sampler07OutputReady"
+             availability="$SubsliceMask 128 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="Slice0 Subslice5 Sampler Output Ready"
+             description="The percentage of time in which slice0 subslice5 sampler output is ready"
+             data_type="float"
+             max_equation="100"
+             equation="C 5 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler05_output_ready"
+             units="percent"
+             symbol_name="Sampler05OutputReady"
+             availability="$SubsliceMask 32 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Slice0 Subslice0 Sampler Output Ready"
+             description="The percentage of time in which slice0 subslice0 sampler output is ready"
+             data_type="float"
+             max_equation="100"
+             equation="C 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler00_output_ready"
+             units="percent"
+             symbol_name="Sampler00OutputReady"
+             availability="$SubsliceMask 1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Slice0 Subslice1 Sampler Output Ready"
+             description="The percentage of time in which slice0 subslice1 sampler output is ready"
+             data_type="float"
+             max_equation="100"
+             equation="C 1 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler01_output_ready"
+             units="percent"
+             symbol_name="Sampler01OutputReady"
+             availability="$SubsliceMask 2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="$ShaderMemoryAccesses 64 UMUL"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00000D04" value="0x00000200" />
+        <register type="NOA" address="0x00009840" value="0x00000000" />
+        <register type="NOA" address="0x00009884" value="0x00000000" />
+        <register type="NOA" address="0x00009888" value="0x142D0005" />
+        <register type="NOA" address="0x00009888" value="0x14320005" />
+        <register type="NOA" address="0x00009888" value="0x146D0005" />
+        <register type="NOA" address="0x00009888" value="0x14720005" />
+        <register type="NOA" address="0x00009888" value="0x14AD0005" />
+        <register type="NOA" address="0x00009888" value="0x14B20005" />
+        <register type="NOA" address="0x00009888" value="0x14ED0005" />
+        <register type="NOA" address="0x00009888" value="0x14F20005" />
+        <register type="NOA" address="0x00009888" value="0x1C1E000C" />
+        <register type="NOA" address="0x00009888" value="0x0E1F000C" />
+        <register type="NOA" address="0x00009888" value="0x1C200014" />
+        <register type="NOA" address="0x00009888" value="0x16212800" />
+        <register type="NOA" address="0x00009888" value="0x22290010" />
+        <register type="NOA" address="0x00009888" value="0x1A2A00D0" />
+        <register type="NOA" address="0x00009888" value="0x1A2C000A" />
+        <register type="NOA" address="0x00009888" value="0x0E2D0033" />
+        <register type="NOA" address="0x00009888" value="0x022D0000" />
+        <register type="NOA" address="0x00009888" value="0x0E2F8000" />
+        <register type="NOA" address="0x00009888" value="0x1E300080" />
+        <register type="NOA" address="0x00009888" value="0x1A310008" />
+        <register type="NOA" address="0x00009888" value="0x0E321980" />
+        <register type="NOA" address="0x00009888" value="0x02320000" />
+        <register type="NOA" address="0x00009888" value="0x125E8000" />
+        <register type="NOA" address="0x00009888" value="0x145E8000" />
+        <register type="NOA" address="0x00009888" value="0x025F8000" />
+        <register type="NOA" address="0x00009888" value="0x045F8000" />
+        <register type="NOA" address="0x00009888" value="0x02604000" />
+        <register type="NOA" address="0x00009888" value="0x04604000" />
+        <register type="NOA" address="0x00009888" value="0x02618000" />
+        <register type="NOA" address="0x00009888" value="0x04618000" />
+        <register type="NOA" address="0x00009888" value="0x12698000" />
+        <register type="NOA" address="0x00009888" value="0x026A4000" />
+        <register type="NOA" address="0x00009888" value="0x046AC000" />
+        <register type="NOA" address="0x00009888" value="0x066C8000" />
+        <register type="NOA" address="0x00009888" value="0x086C8000" />
+        <register type="NOA" address="0x00009888" value="0x006D1980" />
+        <register type="NOA" address="0x00009888" value="0x026D0000" />
+        <register type="NOA" address="0x00009888" value="0x026F4000" />
+        <register type="NOA" address="0x00009888" value="0x1A702000" />
+        <register type="NOA" address="0x00009888" value="0x08718000" />
+        <register type="NOA" address="0x00009888" value="0x02720033" />
+        <register type="NOA" address="0x00009888" value="0x169E8000" />
+        <register type="NOA" address="0x00009888" value="0x189E4000" />
+        <register type="NOA" address="0x00009888" value="0x069F8000" />
+        <register type="NOA" address="0x00009888" value="0x089F8000" />
+        <register type="NOA" address="0x00009888" value="0x06A04000" />
+        <register type="NOA" address="0x00009888" value="0x08A04000" />
+        <register type="NOA" address="0x00009888" value="0x06A18000" />
+        <register type="NOA" address="0x00009888" value="0x08A18000" />
+        <register type="NOA" address="0x00009888" value="0x16A98000" />
+        <register type="NOA" address="0x00009888" value="0x06AA4000" />
+        <register type="NOA" address="0x00009888" value="0x08AAC000" />
+        <register type="NOA" address="0x00009888" value="0x0AAC8000" />
+        <register type="NOA" address="0x00009888" value="0x0CAC8000" />
+        <register type="NOA" address="0x00009888" value="0x02AD1980" />
+        <register type="NOA" address="0x00009888" value="0x04AF4000" />
+        <register type="NOA" address="0x00009888" value="0x1CB00002" />
+        <register type="NOA" address="0x00009888" value="0x0CB18000" />
+        <register type="NOA" address="0x00009888" value="0x04B20033" />
+        <register type="NOA" address="0x00009888" value="0x02B20000" />
+        <register type="NOA" address="0x00009888" value="0x18DE8000" />
+        <register type="NOA" address="0x00009888" value="0x1ADE0400" />
+        <register type="NOA" address="0x00009888" value="0x0ADF8000" />
+        <register type="NOA" address="0x00009888" value="0x0CDF0400" />
+        <register type="NOA" address="0x00009888" value="0x0AE04000" />
+        <register type="NOA" address="0x00009888" value="0x0CE04000" />
+        <register type="NOA" address="0x00009888" value="0x0AE18000" />
+        <register type="NOA" address="0x00009888" value="0x0CE18000" />
+        <register type="NOA" address="0x00009888" value="0x1EE98000" />
+        <register type="NOA" address="0x00009888" value="0x0AEA4000" />
+        <register type="NOA" address="0x00009888" value="0x0CEAC000" />
+        <register type="NOA" address="0x00009888" value="0x0EEC8000" />
+        <register type="NOA" address="0x00009888" value="0x18EC0002" />
+        <register type="NOA" address="0x00009888" value="0x04ED1980" />
+        <register type="NOA" address="0x00009888" value="0x02ED0000" />
+        <register type="NOA" address="0x00009888" value="0x06EF4000" />
+        <register type="NOA" address="0x00009888" value="0x1CF00020" />
+        <register type="NOA" address="0x00009888" value="0x18F10002" />
+        <register type="NOA" address="0x00009888" value="0x06F20033" />
+        <register type="NOA" address="0x00009888" value="0x02F20000" />
+        <register type="NOA" address="0x00009888" value="0x10040140" />
+        <register type="NOA" address="0x00009888" value="0x0C045000" />
+        <register type="NOA" address="0x00009888" value="0x0E040055" />
+        <register type="NOA" address="0x00009888" value="0x14050050" />
+        <register type="NOA" address="0x00009888" value="0x04054000" />
+        <register type="NOA" address="0x00009888" value="0x06055000" />
+        <register type="NOA" address="0x00009888" value="0x08055000" />
+        <register type="NOA" address="0x00009888" value="0x0A051000" />
+        <register type="NOA" address="0x00009888" value="0x260600C0" />
+        <register type="NOA" address="0x00009888" value="0x24067E00" />
+        <register type="NOA" address="0x00009888" value="0x00088000" />
+        <register type="NOA" address="0x00009888" value="0x02082000" />
+        <register type="NOA" address="0x00009888" value="0x04094000" />
+        <register type="NOA" address="0x00009888" value="0x06091000" />
+        <register type="NOA" address="0x00009888" value="0x040D8000" />
+        <register type="NOA" address="0x00009888" value="0x060D2000" />
+        <register type="NOA" address="0x00009888" value="0x080E4000" />
+        <register type="NOA" address="0x00009888" value="0x0A0E1000" />
+        <register type="NOA" address="0x00009888" value="0x02128000" />
+        <register type="NOA" address="0x00009888" value="0x04128000" />
+        <register type="NOA" address="0x00009888" value="0x0612C000" />
+        <register type="NOA" address="0x00009888" value="0x0812C000" />
+        <register type="NOA" address="0x00009888" value="0x0413E000" />
+        <register type="NOA" address="0x00009888" value="0x06131000" />
+        <register type="NOA" address="0x00009888" value="0x00148000" />
+        <register type="NOA" address="0x00009888" value="0x0214C000" />
+        <register type="NOA" address="0x00009888" value="0x04144000" />
+        <register type="NOA" address="0x00009888" value="0x1815000F" />
+        <register type="NOA" address="0x00009888" value="0x02154000" />
+        <register type="NOA" address="0x00009888" value="0x04154000" />
+        <register type="NOA" address="0x00009888" value="0x06154000" />
+        <register type="NOA" address="0x00009888" value="0x08154000" />
+        <register type="NOA" address="0x00009888" value="0x0A158000" />
+        <register type="NOA" address="0x00009888" value="0x0C158000" />
+        <register type="NOA" address="0x00009888" value="0x0E18A000" />
+        <register type="NOA" address="0x00009888" value="0x14190028" />
+        <register type="NOA" address="0x00009888" value="0x021C8000" />
+        <register type="NOA" address="0x00009888" value="0x041C2000" />
+        <register type="NOA" address="0x00009888" value="0x0A1D8000" />
+        <register type="NOA" address="0x00009888" value="0x0C1D2000" />
+        <register type="NOA" address="0x00009884" value="0x00000003" />
+        <register type="NOA" address="0x00009888" value="0x1C1F3000" />
+        <register type="NOA" address="0x00009888" value="0x2A1F0061" />
+        <register type="NOA" address="0x00009888" value="0x181F0000" />
+        <register type="NOA" address="0x00009888" value="0x521F0000" />
+        <register type="NOA" address="0x00009888" value="0x541F0024" />
+        <register type="NOA" address="0x00009888" value="0x3A1F8000" />
+        <register type="NOA" address="0x00009888" value="0x4E1F2430" />
+        <register type="NOA" address="0x00009888" value="0x501F0124" />
+        <register type="NOA" address="0x00009888" value="0x4C1F5047" />
+        <register type="NOA" address="0x00009888" value="0x301F0000" />
+        <register type="NOA" address="0x00009888" value="0x401F0020" />
+        <register type="NOA" address="0x00009888" value="0x421F0020" />
+        <register type="NOA" address="0x00009888" value="0x441F3050" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x00800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+    </register_config>
+  </set>
+
+  <set name="Metric set TDL_1"
+       mdapi_supported_apis="VK OGL OCL IO BB"
+       underscore_name="tdl_1"
+       hw_config_guid="eddc2f32-b196-4a72-9bf8-21770e35f8bd"
+       chipset="ICL"
+       symbol_name="TDL_1"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on the both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="PS Thread Ready For Dispatch on Slice0 Subslice3 Thread Dispatcher"
+             description="The percentage of time in which PS thread is ready for dispatch on slice0 subslice3 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="B 4 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_thread03_ready_for_dispatch"
+             units="percent"
+             symbol_name="PSThread03ReadyForDispatch"
+             availability="$SubsliceMask 8 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="FS AVG Stall per Thread"
+             description="The average number of cycles per hardware thread run in which fragment shaders were stalled on the EUs."
+             data_type="uint64"
+             equation="A 20 READ A 6 READ UDIV"
+             underscore_name="ps_eu_stall_per_thread"
+             units="cycles"
+             symbol_name="PsEuStallPerThread"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS AVG Stall per Thread"
+             description="The average number of cycles per hardware thread run in which vertex shaders were stalled on the EUs."
+             data_type="uint64"
+             equation="A 14 READ A 1 READ UDIV"
+             underscore_name="vs_eu_stall_per_thread"
+             units="cycles"
+             symbol_name="VsEuStallPerThread"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="FS AVG Active per Thread"
+             description="The average number of cycles per hardware thread run in which fragment shaders were processed actively on the EUs."
+             data_type="uint64"
+             equation="A 19 READ A 6 READ UDIV"
+             underscore_name="ps_eu_active_per_thread"
+             units="cycles"
+             symbol_name="PsEuActivePerThread"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="FS EU Active"
+             description="The percentage of time in which fragment shaders were processed actively on the EUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 19 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_active"
+             units="percent"
+             symbol_name="PsEuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="EU Array/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Thread Ready For Dispatch on Slice0 Subslice0 Thread Dispatcher"
+             description="The percentage of time in which PS thread is ready for dispatch on slice0 subslice0 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="B 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_thread00_ready_for_dispatch"
+             units="percent"
+             symbol_name="PSThread00ReadyForDispatch"
+             availability="$SubsliceMask 1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Thread Ready For Dispatch on Slice0 Subslice7 Thread Dispatcher"
+             description="The percentage of time in which PS thread is ready for dispatch on slice0 subslice7 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_thread07_ready_for_dispatch"
+             units="percent"
+             symbol_name="PSThread07ReadyForDispatch"
+             availability="$SubsliceMask 128 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="FS EU Stall"
+             description="The percentage of time in which fragment shaders were stalled on the EUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 20 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_stall"
+             units="percent"
+             symbol_name="PsEuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="EU Array/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Thread Ready For Dispatch on Slice0 Subslice5 Thread Dispatcher"
+             description="The percentage of time in which PS thread is ready for dispatch on slice0 subslice5 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="B 2 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_thread05_ready_for_dispatch"
+             units="percent"
+             symbol_name="PSThread05ReadyForDispatch"
+             availability="$SubsliceMask 32 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="VS EU Active"
+             description="The percentage of time in which vertex shaders were processed actively on the EUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 13 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_eu_active"
+             units="percent"
+             symbol_name="VsEuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="PS Thread Ready For Dispatch on Slice0 Subslice1 Thread Dispatcher"
+             description="The percentage of time in which PS thread is ready for dispatch on slice0 subslice1 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="B 6 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_thread01_ready_for_dispatch"
+             units="percent"
+             symbol_name="PSThread01ReadyForDispatch"
+             availability="$SubsliceMask 2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="PS Thread Ready For Dispatch on Slice0 Subslice4 Thread Dispatcher"
+             description="The percentage of time in which PS thread is ready for dispatch on slice0 subslice4 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="B 3 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_thread04_ready_for_dispatch"
+             units="percent"
+             symbol_name="PSThread04ReadyForDispatch"
+             availability="$SubsliceMask 16 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="VS EU Stall"
+             description="The percentage of time in which vertex shaders were stalled on the EUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 14 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_eu_stall"
+             units="percent"
+             symbol_name="VsEuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="VS AVG Active per Thread"
+             description="The average number of cycles per hardware thread run in which vertex shaders were processed actively on the EUs."
+             data_type="uint64"
+             equation="A 13 READ A 1 READ UDIV"
+             underscore_name="vs_eu_active_per_thread"
+             units="cycles"
+             symbol_name="VsEuActivePerThread"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="PS Thread Ready For Dispatch on Slice0 Subslice2 Thread Dispatcher"
+             description="The percentage of time in which PS thread is ready for dispatch on slice0 subslice2 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="B 5 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_thread02_ready_for_dispatch"
+             units="percent"
+             symbol_name="PSThread02ReadyForDispatch"
+             availability="$SubsliceMask 4 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="$ShaderMemoryAccesses 64 UMUL"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="PS Thread Ready For Dispatch on Slice0 Subslice6 Thread Dispatcher"
+             description="The percentage of time in which PS thread is ready for dispatch on slice0 subslice6 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="B 1 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_thread06_ready_for_dispatch"
+             units="percent"
+             symbol_name="PSThread06ReadyForDispatch"
+             availability="$SubsliceMask 64 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00000D04" value="0x00000200" />
+        <register type="NOA" address="0x00009840" value="0x00000000" />
+        <register type="NOA" address="0x00009884" value="0x00000000" />
+        <register type="NOA" address="0x00009888" value="0x14290000" />
+        <register type="NOA" address="0x00009888" value="0x142E0000" />
+        <register type="NOA" address="0x00009888" value="0x14690000" />
+        <register type="NOA" address="0x00009888" value="0x146E0000" />
+        <register type="NOA" address="0x00009888" value="0x14A90000" />
+        <register type="NOA" address="0x00009888" value="0x14AE0000" />
+        <register type="NOA" address="0x00009888" value="0x14E90000" />
+        <register type="NOA" address="0x00009888" value="0x14EE0000" />
+        <register type="NOA" address="0x00009888" value="0x161E8000" />
+        <register type="NOA" address="0x00009888" value="0x181EC000" />
+        <register type="NOA" address="0x00009888" value="0x1A1E0400" />
+        <register type="NOA" address="0x00009888" value="0x061F8000" />
+        <register type="NOA" address="0x00009888" value="0x081F8000" />
+        <register type="NOA" address="0x00009888" value="0x0A1F8000" />
+        <register type="NOA" address="0x00009888" value="0x0C1F0400" />
+        <register type="NOA" address="0x00009888" value="0x06204000" />
+        <register type="NOA" address="0x00009888" value="0x08204000" />
+        <register type="NOA" address="0x00009888" value="0x0A204000" />
+        <register type="NOA" address="0x00009888" value="0x0C204000" />
+        <register type="NOA" address="0x00009888" value="0x06218000" />
+        <register type="NOA" address="0x00009888" value="0x08218000" />
+        <register type="NOA" address="0x00009888" value="0x0A218000" />
+        <register type="NOA" address="0x00009888" value="0x0C218000" />
+        <register type="NOA" address="0x00009888" value="0x0429C300" />
+        <register type="NOA" address="0x00009888" value="0x062900C5" />
+        <register type="NOA" address="0x00009888" value="0x22290000" />
+        <register type="NOA" address="0x00009888" value="0x1E290000" />
+        <register type="NOA" address="0x00009888" value="0x20290000" />
+        <register type="NOA" address="0x00009888" value="0x062AC000" />
+        <register type="NOA" address="0x00009888" value="0x082AC000" />
+        <register type="NOA" address="0x00009888" value="0x0A2A4000" />
+        <register type="NOA" address="0x00009888" value="0x0C2A4000" />
+        <register type="NOA" address="0x00009888" value="0x0A2C8000" />
+        <register type="NOA" address="0x00009888" value="0x0C2C8000" />
+        <register type="NOA" address="0x00009888" value="0x0E2C8000" />
+        <register type="NOA" address="0x00009888" value="0x182C0002" />
+        <register type="NOA" address="0x00009888" value="0x022EC300" />
+        <register type="NOA" address="0x00009888" value="0x042E00C5" />
+        <register type="NOA" address="0x00009888" value="0x102E0000" />
+        <register type="NOA" address="0x00009888" value="0x022F8000" />
+        <register type="NOA" address="0x00009888" value="0x042F4000" />
+        <register type="NOA" address="0x00009888" value="0x1A304000" />
+        <register type="NOA" address="0x00009888" value="0x1C300001" />
+        <register type="NOA" address="0x00009888" value="0x1C5E000C" />
+        <register type="NOA" address="0x00009888" value="0x125E8000" />
+        <register type="NOA" address="0x00009888" value="0x145E8000" />
+        <register type="NOA" address="0x00009888" value="0x0E5F000C" />
+        <register type="NOA" address="0x00009888" value="0x025F8000" />
+        <register type="NOA" address="0x00009888" value="0x045F8000" />
+        <register type="NOA" address="0x00009888" value="0x1C600014" />
+        <register type="NOA" address="0x00009888" value="0x02604000" />
+        <register type="NOA" address="0x00009888" value="0x04604000" />
+        <register type="NOA" address="0x00009888" value="0x16612800" />
+        <register type="NOA" address="0x00009888" value="0x02618000" />
+        <register type="NOA" address="0x00009888" value="0x04618000" />
+        <register type="NOA" address="0x00009888" value="0x0069C300" />
+        <register type="NOA" address="0x00009888" value="0x026900C5" />
+        <register type="NOA" address="0x00009888" value="0x22690000" />
+        <register type="NOA" address="0x00009888" value="0x12690000" />
+        <register type="NOA" address="0x00009888" value="0x1A6A00F0" />
+        <register type="NOA" address="0x00009888" value="0x026A4000" />
+        <register type="NOA" address="0x00009888" value="0x046A4000" />
+        <register type="NOA" address="0x00009888" value="0x1A6C000A" />
+        <register type="NOA" address="0x00009888" value="0x066C8000" />
+        <register type="NOA" address="0x00009888" value="0x086C8000" />
+        <register type="NOA" address="0x00009888" value="0x0E6EC5C3" />
+        <register type="NOA" address="0x00009888" value="0x106E0000" />
+        <register type="NOA" address="0x00009888" value="0x0E6FC000" />
+        <register type="NOA" address="0x00009888" value="0x1E700050" />
+        <register type="NOA" address="0x00009888" value="0x1A9EC000" />
+        <register type="NOA" address="0x00009888" value="0x1C9E0003" />
+        <register type="NOA" address="0x00009888" value="0x0C9FC000" />
+        <register type="NOA" address="0x00009888" value="0x0E9F0003" />
+        <register type="NOA" address="0x00009888" value="0x1AA02A00" />
+        <register type="NOA" address="0x00009888" value="0x1CA00001" />
+        <register type="NOA" address="0x00009888" value="0x16A102A8" />
+        <register type="NOA" address="0x00009888" value="0x0CA9C5C3" />
+        <register type="NOA" address="0x00009888" value="0x22A90000" />
+        <register type="NOA" address="0x00009888" value="0x18AAF000" />
+        <register type="NOA" address="0x00009888" value="0x1AAA0005" />
+        <register type="NOA" address="0x00009888" value="0x18ACAA00" />
+        <register type="NOA" address="0x00009888" value="0x0AAEC5C3" />
+        <register type="NOA" address="0x00009888" value="0x10AE0000" />
+        <register type="NOA" address="0x00009888" value="0x0AAFC000" />
+        <register type="NOA" address="0x00009888" value="0x1CB05000" />
+        <register type="NOA" address="0x00009888" value="0x10DE8000" />
+        <register type="NOA" address="0x00009888" value="0x1ADE3800" />
+        <register type="NOA" address="0x00009888" value="0x00DF8000" />
+        <register type="NOA" address="0x00009888" value="0x0CDF3800" />
+        <register type="NOA" address="0x00009888" value="0x00E04000" />
+        <register type="NOA" address="0x00009888" value="0x0EE04000" />
+        <register type="NOA" address="0x00009888" value="0x1AE000A0" />
+        <register type="NOA" address="0x00009888" value="0x00E18000" />
+        <register type="NOA" address="0x00009888" value="0x0EE18000" />
+        <register type="NOA" address="0x00009888" value="0x14E18000" />
+        <register type="NOA" address="0x00009888" value="0x16E10002" />
+        <register type="NOA" address="0x00009888" value="0x08E9C5C3" />
+        <register type="NOA" address="0x00009888" value="0x22E90000" />
+        <register type="NOA" address="0x00009888" value="0x20E90000" />
+        <register type="NOA" address="0x00009888" value="0x00EAC000" />
+        <register type="NOA" address="0x00009888" value="0x0EEAC000" />
+        <register type="NOA" address="0x00009888" value="0x18EA0500" />
+        <register type="NOA" address="0x00009888" value="0x04EC8000" />
+        <register type="NOA" address="0x00009888" value="0x18EC00A8" />
+        <register type="NOA" address="0x00009888" value="0x00EE00C3" />
+        <register type="NOA" address="0x00009888" value="0x06EEC500" />
+        <register type="NOA" address="0x00009888" value="0x10EE0000" />
+        <register type="NOA" address="0x00009888" value="0x00EF4000" />
+        <register type="NOA" address="0x00009888" value="0x06EF8000" />
+        <register type="NOA" address="0x00009888" value="0x18F04000" />
+        <register type="NOA" address="0x00009888" value="0x1CF00040" />
+        <register type="NOA" address="0x00009888" value="0x0C045400" />
+        <register type="NOA" address="0x00009888" value="0x0E045555" />
+        <register type="NOA" address="0x00009888" value="0x10040155" />
+        <register type="NOA" address="0x00009888" value="0x04055000" />
+        <register type="NOA" address="0x00009888" value="0x0A055000" />
+        <register type="NOA" address="0x00009888" value="0x0C055000" />
+        <register type="NOA" address="0x00009888" value="0x0E055000" />
+        <register type="NOA" address="0x00009888" value="0x14050055" />
+        <register type="NOA" address="0x00009888" value="0x06055000" />
+        <register type="NOA" address="0x00009888" value="0x08055000" />
+        <register type="NOA" address="0x00009888" value="0x2406FF00" />
+        <register type="NOA" address="0x00009888" value="0x260600FF" />
+        <register type="NOA" address="0x00009888" value="0x0E08A000" />
+        <register type="NOA" address="0x00009888" value="0x00088000" />
+        <register type="NOA" address="0x00009888" value="0x02082000" />
+        <register type="NOA" address="0x00009888" value="0x14090050" />
+        <register type="NOA" address="0x00009888" value="0x04094000" />
+        <register type="NOA" address="0x00009888" value="0x06091000" />
+        <register type="NOA" address="0x00009888" value="0x000D2000" />
+        <register type="NOA" address="0x00009888" value="0x060D8000" />
+        <register type="NOA" address="0x00009888" value="0x080DA000" />
+        <register type="NOA" address="0x00009888" value="0x040E1000" />
+        <register type="NOA" address="0x00009888" value="0x0A0E4000" />
+        <register type="NOA" address="0x00009888" value="0x0C0E5000" />
+        <register type="NOA" address="0x00009888" value="0x1812FC00" />
+        <register type="NOA" address="0x00009888" value="0x1A12002B" />
+        <register type="NOA" address="0x00009888" value="0x02128000" />
+        <register type="NOA" address="0x00009888" value="0x04128000" />
+        <register type="NOA" address="0x00009888" value="0x0813C000" />
+        <register type="NOA" address="0x00009888" value="0x0A13F000" />
+        <register type="NOA" address="0x00009888" value="0x04136000" />
+        <register type="NOA" address="0x00009888" value="0x0A14C000" />
+        <register type="NOA" address="0x00009888" value="0x0C14C000" />
+        <register type="NOA" address="0x00009888" value="0x0E14C000" />
+        <register type="NOA" address="0x00009888" value="0x00148000" />
+        <register type="NOA" address="0x00009888" value="0x02144000" />
+        <register type="NOA" address="0x00009888" value="0x00158000" />
+        <register type="NOA" address="0x00009888" value="0x0E158000" />
+        <register type="NOA" address="0x00009888" value="0x16152AD0" />
+        <register type="NOA" address="0x00009888" value="0x18150005" />
+        <register type="NOA" address="0x00009888" value="0x02154000" />
+        <register type="NOA" address="0x00009888" value="0x04154000" />
+        <register type="NOA" address="0x00009888" value="0x0615C000" />
+        <register type="NOA" address="0x00009888" value="0x0815C000" />
+        <register type="NOA" address="0x00009888" value="0x0A15C000" />
+        <register type="NOA" address="0x00009888" value="0x0C15C000" />
+        <register type="NOA" address="0x00009888" value="0x02188000" />
+        <register type="NOA" address="0x00009888" value="0x0418A000" />
+        <register type="NOA" address="0x00009888" value="0x06182000" />
+        <register type="NOA" address="0x00009888" value="0x0A198000" />
+        <register type="NOA" address="0x00009888" value="0x0C19A000" />
+        <register type="NOA" address="0x00009888" value="0x0E192000" />
+        <register type="NOA" address="0x00009888" value="0x0A1CA000" />
+        <register type="NOA" address="0x00009888" value="0x0C1CA000" />
+        <register type="NOA" address="0x00009888" value="0x121D5400" />
+        <register type="NOA" address="0x00009888" value="0x141D0002" />
+        <register type="NOA" address="0x00009884" value="0x00000003" />
+        <register type="NOA" address="0x00009888" value="0x301F8000" />
+        <register type="NOA" address="0x00009888" value="0x501F4924" />
+        <register type="NOA" address="0x00009888" value="0x521F4924" />
+        <register type="NOA" address="0x00009888" value="0x541F0024" />
+        <register type="NOA" address="0x00009888" value="0x3A1F8000" />
+        <register type="NOA" address="0x00009888" value="0x4E1F2400" />
+        <register type="NOA" address="0x00009888" value="0x3E1F3000" />
+        <register type="NOA" address="0x00009888" value="0x461F5030" />
+        <register type="NOA" address="0x00009888" value="0x481F0050" />
+        <register type="NOA" address="0x00009888" value="0x4A1F2000" />
+        <register type="NOA" address="0x00009888" value="0x4C1F0020" />
+        <register type="NOA" address="0x00009888" value="0x181F0000" />
+        <register type="NOA" address="0x00009888" value="0x401F2020" />
+        <register type="NOA" address="0x00009888" value="0x421F3030" />
+        <register type="NOA" address="0x00009888" value="0x441F5050" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0xF0800000" />
+        <register type="OA" address="0x00002770" value="0x00000018" />
+        <register type="OA" address="0x00002774" value="0x0000FFFC" />
+        <register type="OA" address="0x00002778" value="0x00000060" />
+        <register type="OA" address="0x0000277C" value="0x0000FFF3" />
+        <register type="OA" address="0x00002780" value="0x00000180" />
+        <register type="OA" address="0x00002784" value="0x0000FFCF" />
+        <register type="OA" address="0x00002788" value="0x00000600" />
+        <register type="OA" address="0x0000278C" value="0x0000FF3F" />
+        <register type="OA" address="0x00002790" value="0x00001800" />
+        <register type="OA" address="0x00002794" value="0x0000FCFF" />
+        <register type="OA" address="0x00002798" value="0x00006000" />
+        <register type="OA" address="0x0000279C" value="0x0000F3FF" />
+        <register type="OA" address="0x000027A0" value="0x00018000" />
+        <register type="OA" address="0x000027A4" value="0x0000CFFF" />
+        <register type="OA" address="0x000027A8" value="0x00060000" />
+        <register type="OA" address="0x000027AC" value="0x00003FFF" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E758" value="0x00015014" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+        <register type="FLEX" address="0x0000E65C" value="0x00055054" />
+    </register_config>
+  </set>
+
+  <set name="Metric set TDL_2"
+       mdapi_supported_apis="VK OGL OCL IO BB"
+       underscore_name="tdl_2"
+       hw_config_guid="c6d3af7b-037b-4656-95e1-4f838f0a2c14"
+       chipset="ICL"
+       symbol_name="TDL_2"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SQ is full"
+             description="The percentage of time when SQ is filled above a threshold (usually 48 entries)"
+             data_type="float"
+             max_equation="100"
+             equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gt_request_queue_full"
+             units="percent"
+             symbol_name="GTRequestQueueFull"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on the both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Non-PS Thread Ready For Dispatch on Slice0 Subslice2 Thread Dispatcher"
+             description="The percentage of time in which non-PS thread is ready for dispatch on slice0 subslice2 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="GPU_CLOCK 0 READ C 1 READ FSUB 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="non_ps_thread02_ready_for_dispatch"
+             units="percent"
+             symbol_name="NonPSThread02ReadyForDispatch"
+             availability="$SubsliceMask 4 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Non-PS Thread Ready For Dispatch on Slice0 Subslice3 Thread Dispatcher"
+             description="The percentage of time in which non-PS thread is ready for dispatch on slice0 subslice3 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="GPU_CLOCK 0 READ C 2 READ FSUB 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="non_ps_thread03_ready_for_dispatch"
+             units="percent"
+             symbol_name="NonPSThread03ReadyForDispatch"
+             availability="$SubsliceMask 8 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="Non-PS Thread Ready For Dispatch on Slice0 Subslice0 Thread Dispatcher"
+             description="The percentage of time in which non-PS thread is ready for dispatch on slice0 subslice0 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="GPU_CLOCK 0 READ B 7 READ FSUB 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="non_ps_thread00_ready_for_dispatch"
+             units="percent"
+             symbol_name="NonPSThread00ReadyForDispatch"
+             availability="$SubsliceMask 1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Non-PS Thread Ready For Dispatch on Slice0 Subslice7 Thread Dispatcher"
+             description="The percentage of time in which non-PS thread is ready for dispatch on slice0 subslice7 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="GPU_CLOCK 0 READ C 6 READ FSUB 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="non_ps_thread07_ready_for_dispatch"
+             units="percent"
+             symbol_name="NonPSThread07ReadyForDispatch"
+             availability="$SubsliceMask 128 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Non-PS Thread Ready For Dispatch on Slice0 Subslice6 Thread Dispatcher"
+             description="The percentage of time in which non-PS thread is ready for dispatch on slice0 subslice6 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="GPU_CLOCK 0 READ C 5 READ FSUB 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="non_ps_thread06_ready_for_dispatch"
+             units="percent"
+             symbol_name="NonPSThread06ReadyForDispatch"
+             availability="$SubsliceMask 64 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="Non-PS Thread Ready For Dispatch on Slice0 Subslice5 Thread Dispatcher"
+             description="The percentage of time in which non-PS thread is ready for dispatch on slice0 subslice5 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="GPU_CLOCK 0 READ C 4 READ FSUB 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="non_ps_thread05_ready_for_dispatch"
+             units="percent"
+             symbol_name="NonPSThread05ReadyForDispatch"
+             availability="$SubsliceMask 32 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Non-PS Thread Ready For Dispatch on Slice0 Subslice4 Thread Dispatcher"
+             description="The percentage of time in which non-PS thread is ready for dispatch on slice0 subslice4 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="GPU_CLOCK 0 READ C 3 READ FSUB 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="non_ps_thread04_ready_for_dispatch"
+             units="percent"
+             symbol_name="NonPSThread04ReadyForDispatch"
+             availability="$SubsliceMask 16 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="$ShaderMemoryAccesses 64 UMUL"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <counter name="Non-PS Thread Ready For Dispatch on Slice0 Subslice1 Thread Dispatcher"
+             description="The percentage of time in which non-PS thread is ready for dispatch on slice0 subslice1 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="GPU_CLOCK 0 READ C 0 READ FSUB 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="non_ps_thread01_ready_for_dispatch"
+             units="percent"
+             symbol_name="NonPSThread01ReadyForDispatch"
+             availability="$SubsliceMask 2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00000D04" value="0x00000200" />
+        <register type="NOA" address="0x00009840" value="0x00000000" />
+        <register type="NOA" address="0x00009884" value="0x00000000" />
+        <register type="NOA" address="0x00009888" value="0x14290000" />
+        <register type="NOA" address="0x00009888" value="0x142E0000" />
+        <register type="NOA" address="0x00009888" value="0x14690000" />
+        <register type="NOA" address="0x00009888" value="0x146E0000" />
+        <register type="NOA" address="0x00009888" value="0x14A90000" />
+        <register type="NOA" address="0x00009888" value="0x14AE0000" />
+        <register type="NOA" address="0x00009888" value="0x14E90000" />
+        <register type="NOA" address="0x00009888" value="0x14EE0000" />
+        <register type="NOA" address="0x00009888" value="0x1C1E0006" />
+        <register type="NOA" address="0x00009888" value="0x0E1F0006" />
+        <register type="NOA" address="0x00009888" value="0x1C200005" />
+        <register type="NOA" address="0x00009888" value="0x16210A00" />
+        <register type="NOA" address="0x00009888" value="0x0C29C100" />
+        <register type="NOA" address="0x00009888" value="0x22290000" />
+        <register type="NOA" address="0x00009888" value="0x1A2A0034" />
+        <register type="NOA" address="0x00009888" value="0x182C8000" />
+        <register type="NOA" address="0x00009888" value="0x1A2C0002" />
+        <register type="NOA" address="0x00009888" value="0x0E2E00C1" />
+        <register type="NOA" address="0x00009888" value="0x102E0000" />
+        <register type="NOA" address="0x00009888" value="0x0E2F4000" />
+        <register type="NOA" address="0x00009888" value="0x1E300010" />
+        <register type="NOA" address="0x00009888" value="0x1C5E0008" />
+        <register type="NOA" address="0x00009888" value="0x125E8000" />
+        <register type="NOA" address="0x00009888" value="0x0E5F0008" />
+        <register type="NOA" address="0x00009888" value="0x025F8000" />
+        <register type="NOA" address="0x00009888" value="0x1C600010" />
+        <register type="NOA" address="0x00009888" value="0x02604000" />
+        <register type="NOA" address="0x00009888" value="0x16612000" />
+        <register type="NOA" address="0x00009888" value="0x02618000" />
+        <register type="NOA" address="0x00009888" value="0x0E69C100" />
+        <register type="NOA" address="0x00009888" value="0x22690000" />
+        <register type="NOA" address="0x00009888" value="0x1A6A0040" />
+        <register type="NOA" address="0x00009888" value="0x026AC000" />
+        <register type="NOA" address="0x00009888" value="0x1A6C0008" />
+        <register type="NOA" address="0x00009888" value="0x066C8000" />
+        <register type="NOA" address="0x00009888" value="0x006EC100" />
+        <register type="NOA" address="0x00009888" value="0x106E0000" />
+        <register type="NOA" address="0x00009888" value="0x006F8000" />
+        <register type="NOA" address="0x00009888" value="0x1A700400" />
+        <register type="NOA" address="0x00009888" value="0x149E8000" />
+        <register type="NOA" address="0x00009888" value="0x169E8000" />
+        <register type="NOA" address="0x00009888" value="0x049F8000" />
+        <register type="NOA" address="0x00009888" value="0x069F8000" />
+        <register type="NOA" address="0x00009888" value="0x04A04000" />
+        <register type="NOA" address="0x00009888" value="0x06A04000" />
+        <register type="NOA" address="0x00009888" value="0x04A18000" />
+        <register type="NOA" address="0x00009888" value="0x06A18000" />
+        <register type="NOA" address="0x00009888" value="0x02A900C1" />
+        <register type="NOA" address="0x00009888" value="0x22A90000" />
+        <register type="NOA" address="0x00009888" value="0x04AA4000" />
+        <register type="NOA" address="0x00009888" value="0x06AAC000" />
+        <register type="NOA" address="0x00009888" value="0x08AC8000" />
+        <register type="NOA" address="0x00009888" value="0x0AAC8000" />
+        <register type="NOA" address="0x00009888" value="0x02AEC100" />
+        <register type="NOA" address="0x00009888" value="0x10AE0000" />
+        <register type="NOA" address="0x00009888" value="0x02AF8000" />
+        <register type="NOA" address="0x00009888" value="0x1AB04000" />
+        <register type="NOA" address="0x00009888" value="0x18DEC000" />
+        <register type="NOA" address="0x00009888" value="0x08DF8000" />
+        <register type="NOA" address="0x00009888" value="0x0ADF8000" />
+        <register type="NOA" address="0x00009888" value="0x08E04000" />
+        <register type="NOA" address="0x00009888" value="0x0AE04000" />
+        <register type="NOA" address="0x00009888" value="0x08E18000" />
+        <register type="NOA" address="0x00009888" value="0x0AE18000" />
+        <register type="NOA" address="0x00009888" value="0x04E900C1" />
+        <register type="NOA" address="0x00009888" value="0x22E90000" />
+        <register type="NOA" address="0x00009888" value="0x1CE90000" />
+        <register type="NOA" address="0x00009888" value="0x08EA4000" />
+        <register type="NOA" address="0x00009888" value="0x0AEAC000" />
+        <register type="NOA" address="0x00009888" value="0x0CEC8000" />
+        <register type="NOA" address="0x00009888" value="0x0EEC8000" />
+        <register type="NOA" address="0x00009888" value="0x04EEC100" />
+        <register type="NOA" address="0x00009888" value="0x10EE0000" />
+        <register type="NOA" address="0x00009888" value="0x04EF8000" />
+        <register type="NOA" address="0x00009888" value="0x1CF00004" />
+        <register type="NOA" address="0x00009888" value="0x10040150" />
+        <register type="NOA" address="0x00009888" value="0x0C045000" />
+        <register type="NOA" address="0x00009888" value="0x0E040015" />
+        <register type="NOA" address="0x00009888" value="0x14050054" />
+        <register type="NOA" address="0x00009888" value="0x04054000" />
+        <register type="NOA" address="0x00009888" value="0x06055000" />
+        <register type="NOA" address="0x00009888" value="0x08055000" />
+        <register type="NOA" address="0x00009888" value="0x260600E0" />
+        <register type="NOA" address="0x00009888" value="0x24063E00" />
+        <register type="NOA" address="0x00009888" value="0x0E088000" />
+        <register type="NOA" address="0x00009888" value="0x00088000" />
+        <register type="NOA" address="0x00009888" value="0x14090040" />
+        <register type="NOA" address="0x00009888" value="0x04094000" />
+        <register type="NOA" address="0x00009888" value="0x040DA000" />
+        <register type="NOA" address="0x00009888" value="0x080E5000" />
+        <register type="NOA" address="0x00009888" value="0x1A120020" />
+        <register type="NOA" address="0x00009888" value="0x02128000" />
+        <register type="NOA" address="0x00009888" value="0x0412C000" />
+        <register type="NOA" address="0x00009888" value="0x0612C000" />
+        <register type="NOA" address="0x00009888" value="0x0A138000" />
+        <register type="NOA" address="0x00009888" value="0x0413E000" />
+        <register type="NOA" address="0x00009888" value="0x0E148000" />
+        <register type="NOA" address="0x00009888" value="0x00148000" />
+        <register type="NOA" address="0x00009888" value="0x0214C000" />
+        <register type="NOA" address="0x00009888" value="0x16156000" />
+        <register type="NOA" address="0x00009888" value="0x18150007" />
+        <register type="NOA" address="0x00009888" value="0x02154000" />
+        <register type="NOA" address="0x00009888" value="0x04154000" />
+        <register type="NOA" address="0x00009888" value="0x06154000" />
+        <register type="NOA" address="0x00009888" value="0x08158000" />
+        <register type="NOA" address="0x00009888" value="0x0A158000" />
+        <register type="NOA" address="0x00009888" value="0x0C188000" />
+        <register type="NOA" address="0x00009888" value="0x0E182000" />
+        <register type="NOA" address="0x00009888" value="0x1419000A" />
+        <register type="NOA" address="0x00009888" value="0x021CA000" />
+        <register type="NOA" address="0x00009888" value="0x0A1DA000" />
+        <register type="NOA" address="0x00009884" value="0x00000003" />
+        <register type="NOA" address="0x00009888" value="0x1C1F3061" />
+        <register type="NOA" address="0x00009888" value="0x181F0000" />
+        <register type="NOA" address="0x00009888" value="0x521F4000" />
+        <register type="NOA" address="0x00009888" value="0x541F0024" />
+        <register type="NOA" address="0x00009888" value="0x3A1F8000" />
+        <register type="NOA" address="0x00009888" value="0x4E1F2420" />
+        <register type="NOA" address="0x00009888" value="0x501F0024" />
+        <register type="NOA" address="0x00009888" value="0x4C1F3050" />
+        <register type="NOA" address="0x00009888" value="0x301F0000" />
+        <register type="NOA" address="0x00009888" value="0x401F2000" />
+        <register type="NOA" address="0x00009888" value="0x421F5000" />
+        <register type="NOA" address="0x00009888" value="0x441F3730" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x00800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+    </register_config>
+  </set>
+
+  <set name="Metric set TDL_3"
+       mdapi_supported_apis="VK OGL OCL IO BB"
+       underscore_name="tdl_3"
+       hw_config_guid="fd25ec19-3ed1-40c9-8648-1d2387449a92"
+       chipset="ICL"
+       symbol_name="TDL_3"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Thread Header Ready on Slice0 Subslice6 Thread Dispatcher Port 1"
+             description="The percentage of time in which thread header is ready on slice0 subslice6 thread dispatcher port 1"
+             data_type="float"
+             max_equation="100"
+             equation="C 5 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header06_ready_port1"
+             units="percent"
+             symbol_name="ThreadHeader06ReadyPort1"
+             availability="$SubsliceMask 64 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on the both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="Thread Header Ready on Slice0 Subslice3 Thread Dispatcher Port 0"
+             description="The percentage of time in which thread header is ready on slice0 subslice3 thread dispatcher port 0"
+             data_type="float"
+             max_equation="100"
+             equation="B 6 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header03_ready_port0"
+             units="percent"
+             symbol_name="ThreadHeader03ReadyPort0"
+             availability="$SubsliceMask 8 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Thread Header Ready on Slice0 Subslice3 Thread Dispatcher Port 1"
+             description="The percentage of time in which thread header is ready on slice0 subslice3 thread dispatcher port 1"
+             data_type="float"
+             max_equation="100"
+             equation="B 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header03_ready_port1"
+             units="percent"
+             symbol_name="ThreadHeader03ReadyPort1"
+             availability="$SubsliceMask 8 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Thread Header Ready on Slice0 Subslice4 Thread Dispatcher Port 1"
+             description="The percentage of time in which thread header is ready on slice0 subslice4 thread dispatcher port 1"
+             data_type="float"
+             max_equation="100"
+             equation="C 1 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header04_ready_port1"
+             units="percent"
+             symbol_name="ThreadHeader04ReadyPort1"
+             availability="$SubsliceMask 16 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Thread Header Ready on Slice0 Subslice4 Thread Dispatcher Port 0"
+             description="The percentage of time in which thread header is ready on slice0 subslice4 thread dispatcher port 0"
+             data_type="float"
+             max_equation="100"
+             equation="C 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header04_ready_port0"
+             units="percent"
+             symbol_name="ThreadHeader04ReadyPort0"
+             availability="$SubsliceMask 16 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Thread Header Ready on Slice0 Subslice6 Thread Dispatcher Port 0"
+             description="The percentage of time in which thread header is ready on slice0 subslice6 thread dispatcher port 0"
+             data_type="float"
+             max_equation="100"
+             equation="C 4 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header06_ready_port0"
+             units="percent"
+             symbol_name="ThreadHeader06ReadyPort0"
+             availability="$SubsliceMask 64 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Thread Header Ready on Slice0 Subslice1 Thread Dispatcher Port 0"
+             description="The percentage of time in which thread header is ready on slice0 subslice1 thread dispatcher port 0"
+             data_type="float"
+             max_equation="100"
+             equation="B 2 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header01_ready_port0"
+             units="percent"
+             symbol_name="ThreadHeader01ReadyPort0"
+             availability="$SubsliceMask 2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Thread Header Ready on Slice0 Subslice1 Thread Dispatcher Port 1"
+             description="The percentage of time in which thread header is ready on slice0 subslice1 thread dispatcher port 1"
+             data_type="float"
+             max_equation="100"
+             equation="B 3 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header01_ready_port1"
+             units="percent"
+             symbol_name="ThreadHeader01ReadyPort1"
+             availability="$SubsliceMask 2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Thread Header Ready on Slice0 Subslice7 Thread Dispatcher Port 0"
+             description="The percentage of time in which thread header is ready on slice0 subslice7 thread dispatcher port 0"
+             data_type="float"
+             max_equation="100"
+             equation="C 6 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header07_ready_port0"
+             units="percent"
+             symbol_name="ThreadHeader07ReadyPort0"
+             availability="$SubsliceMask 128 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Thread Header Ready on Slice0 Subslice2 Thread Dispatcher Port 1"
+             description="The percentage of time in which thread header is ready on slice0 subslice2 thread dispatcher port 1"
+             data_type="float"
+             max_equation="100"
+             equation="B 5 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header02_ready_port1"
+             units="percent"
+             symbol_name="ThreadHeader02ReadyPort1"
+             availability="$SubsliceMask 4 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Thread Header Ready on Slice0 Subslice2 Thread Dispatcher Port 0"
+             description="The percentage of time in which thread header is ready on slice0 subslice2 thread dispatcher port 0"
+             data_type="float"
+             max_equation="100"
+             equation="B 4 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header02_ready_port0"
+             units="percent"
+             symbol_name="ThreadHeader02ReadyPort0"
+             availability="$SubsliceMask 4 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Thread Header Ready on Slice0 Subslice5 Thread Dispatcher Port 0"
+             description="The percentage of time in which thread header is ready on slice0 subslice5 thread dispatcher port 0"
+             data_type="float"
+             max_equation="100"
+             equation="C 2 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header05_ready_port0"
+             units="percent"
+             symbol_name="ThreadHeader05ReadyPort0"
+             availability="$SubsliceMask 32 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Thread Header Ready on Slice0 Subslice7 Thread Dispatcher Port 1"
+             description="The percentage of time in which thread header is ready on slice0 subslice7 thread dispatcher port 1"
+             data_type="float"
+             max_equation="100"
+             equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header07_ready_port1"
+             units="percent"
+             symbol_name="ThreadHeader07ReadyPort1"
+             availability="$SubsliceMask 128 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="$ShaderMemoryAccesses 64 UMUL"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="Thread Header Ready on Slice0 Subslice5 Thread Dispatcher Port 1"
+             description="The percentage of time in which thread header is ready on slice0 subslice5 thread dispatcher port 1"
+             data_type="float"
+             max_equation="100"
+             equation="C 3 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header05_ready_port1"
+             units="percent"
+             symbol_name="ThreadHeader05ReadyPort1"
+             availability="$SubsliceMask 32 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Thread Header Ready on Slice0 Subslice0 Thread Dispatcher Port 0"
+             description="The percentage of time in which thread header is ready on slice0 subslice0 thread dispatcher port 0"
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header00_ready_port0"
+             units="percent"
+             symbol_name="ThreadHeader00ReadyPort0"
+             availability="$SubsliceMask 1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <counter name="Thread Header Ready on Slice0 Subslice0 Thread Dispatcher Port 1"
+             description="The percentage of time in which thread header is ready on slice0 subslice0 thread dispatcher port 1"
+             data_type="float"
+             max_equation="100"
+             equation="B 1 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header00_ready_port1"
+             units="percent"
+             symbol_name="ThreadHeader00ReadyPort1"
+             availability="$SubsliceMask 1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00000D04" value="0x00000200" />
+        <register type="NOA" address="0x00009840" value="0x00000000" />
+        <register type="NOA" address="0x00009884" value="0x00000000" />
+        <register type="NOA" address="0x00009888" value="0x14292C00" />
+        <register type="NOA" address="0x00009888" value="0x16290013" />
+        <register type="NOA" address="0x00009888" value="0x142E2C00" />
+        <register type="NOA" address="0x00009888" value="0x162E0013" />
+        <register type="NOA" address="0x00009888" value="0x14692C00" />
+        <register type="NOA" address="0x00009888" value="0x16690013" />
+        <register type="NOA" address="0x00009888" value="0x146E2C00" />
+        <register type="NOA" address="0x00009888" value="0x166E0013" />
+        <register type="NOA" address="0x00009888" value="0x14A92C00" />
+        <register type="NOA" address="0x00009888" value="0x16A90013" />
+        <register type="NOA" address="0x00009888" value="0x14AE2C00" />
+        <register type="NOA" address="0x00009888" value="0x16AE0013" />
+        <register type="NOA" address="0x00009888" value="0x14E92C00" />
+        <register type="NOA" address="0x00009888" value="0x16E90013" />
+        <register type="NOA" address="0x00009888" value="0x14EE2C00" />
+        <register type="NOA" address="0x00009888" value="0x16EE0013" />
+        <register type="NOA" address="0x00009888" value="0x101E8000" />
+        <register type="NOA" address="0x00009888" value="0x1A1E3800" />
+        <register type="NOA" address="0x00009888" value="0x001F8000" />
+        <register type="NOA" address="0x00009888" value="0x0C1F3800" />
+        <register type="NOA" address="0x00009888" value="0x00204000" />
+        <register type="NOA" address="0x00009888" value="0x0E204000" />
+        <register type="NOA" address="0x00009888" value="0x1A2000A0" />
+        <register type="NOA" address="0x00009888" value="0x00218000" />
+        <register type="NOA" address="0x00009888" value="0x0E218000" />
+        <register type="NOA" address="0x00009888" value="0x14218000" />
+        <register type="NOA" address="0x00009888" value="0x16210002" />
+        <register type="NOA" address="0x00009888" value="0x002900C7" />
+        <register type="NOA" address="0x00009888" value="0x0629CF00" />
+        <register type="NOA" address="0x00009888" value="0x22290000" />
+        <register type="NOA" address="0x00009888" value="0x10290000" />
+        <register type="NOA" address="0x00009888" value="0x20290000" />
+        <register type="NOA" address="0x00009888" value="0x002A4000" />
+        <register type="NOA" address="0x00009888" value="0x0E2A4000" />
+        <register type="NOA" address="0x00009888" value="0x182A0F00" />
+        <register type="NOA" address="0x00009888" value="0x042C8000" />
+        <register type="NOA" address="0x00009888" value="0x182C00A8" />
+        <register type="NOA" address="0x00009888" value="0x082ECFC7" />
+        <register type="NOA" address="0x00009888" value="0x102E0000" />
+        <register type="NOA" address="0x00009888" value="0x082FC000" />
+        <register type="NOA" address="0x00009888" value="0x1C300500" />
+        <register type="NOA" address="0x00009888" value="0x1A5EC000" />
+        <register type="NOA" address="0x00009888" value="0x1C5E0003" />
+        <register type="NOA" address="0x00009888" value="0x0C5FC000" />
+        <register type="NOA" address="0x00009888" value="0x0E5F0003" />
+        <register type="NOA" address="0x00009888" value="0x1A602A00" />
+        <register type="NOA" address="0x00009888" value="0x1C600001" />
+        <register type="NOA" address="0x00009888" value="0x166102A8" />
+        <register type="NOA" address="0x00009888" value="0x0A69CFC7" />
+        <register type="NOA" address="0x00009888" value="0x22690000" />
+        <register type="NOA" address="0x00009888" value="0x186A5000" />
+        <register type="NOA" address="0x00009888" value="0x1A6A000F" />
+        <register type="NOA" address="0x00009888" value="0x186CAA00" />
+        <register type="NOA" address="0x00009888" value="0x0C6ECFC7" />
+        <register type="NOA" address="0x00009888" value="0x106E0000" />
+        <register type="NOA" address="0x00009888" value="0x0C6FC000" />
+        <register type="NOA" address="0x00009888" value="0x1E700005" />
+        <register type="NOA" address="0x00009888" value="0x1C9E000C" />
+        <register type="NOA" address="0x00009888" value="0x129E8000" />
+        <register type="NOA" address="0x00009888" value="0x149E8000" />
+        <register type="NOA" address="0x00009888" value="0x0E9F000C" />
+        <register type="NOA" address="0x00009888" value="0x029F8000" />
+        <register type="NOA" address="0x00009888" value="0x049F8000" />
+        <register type="NOA" address="0x00009888" value="0x1CA00014" />
+        <register type="NOA" address="0x00009888" value="0x02A04000" />
+        <register type="NOA" address="0x00009888" value="0x04A04000" />
+        <register type="NOA" address="0x00009888" value="0x16A12800" />
+        <register type="NOA" address="0x00009888" value="0x02A18000" />
+        <register type="NOA" address="0x00009888" value="0x04A18000" />
+        <register type="NOA" address="0x00009888" value="0x0EA9CFC7" />
+        <register type="NOA" address="0x00009888" value="0x22A90000" />
+        <register type="NOA" address="0x00009888" value="0x1AAA0050" />
+        <register type="NOA" address="0x00009888" value="0x02AAC000" />
+        <register type="NOA" address="0x00009888" value="0x04AAC000" />
+        <register type="NOA" address="0x00009888" value="0x1AAC000A" />
+        <register type="NOA" address="0x00009888" value="0x06AC8000" />
+        <register type="NOA" address="0x00009888" value="0x08AC8000" />
+        <register type="NOA" address="0x00009888" value="0x00AEC700" />
+        <register type="NOA" address="0x00009888" value="0x02AE00CF" />
+        <register type="NOA" address="0x00009888" value="0x10AE0000" />
+        <register type="NOA" address="0x00009888" value="0x00AF8000" />
+        <register type="NOA" address="0x00009888" value="0x02AF4000" />
+        <register type="NOA" address="0x00009888" value="0x1AB01400" />
+        <register type="NOA" address="0x00009888" value="0x16DE8000" />
+        <register type="NOA" address="0x00009888" value="0x18DEC000" />
+        <register type="NOA" address="0x00009888" value="0x1ADE0400" />
+        <register type="NOA" address="0x00009888" value="0x06DF8000" />
+        <register type="NOA" address="0x00009888" value="0x08DF8000" />
+        <register type="NOA" address="0x00009888" value="0x0ADF8000" />
+        <register type="NOA" address="0x00009888" value="0x0CDF0400" />
+        <register type="NOA" address="0x00009888" value="0x06E04000" />
+        <register type="NOA" address="0x00009888" value="0x08E04000" />
+        <register type="NOA" address="0x00009888" value="0x0AE04000" />
+        <register type="NOA" address="0x00009888" value="0x0CE04000" />
+        <register type="NOA" address="0x00009888" value="0x06E18000" />
+        <register type="NOA" address="0x00009888" value="0x08E18000" />
+        <register type="NOA" address="0x00009888" value="0x0AE18000" />
+        <register type="NOA" address="0x00009888" value="0x0CE18000" />
+        <register type="NOA" address="0x00009888" value="0x02E9C700" />
+        <register type="NOA" address="0x00009888" value="0x04E900CF" />
+        <register type="NOA" address="0x00009888" value="0x22E90000" />
+        <register type="NOA" address="0x00009888" value="0x1CE90000" />
+        <register type="NOA" address="0x00009888" value="0x06EA4000" />
+        <register type="NOA" address="0x00009888" value="0x08EA4000" />
+        <register type="NOA" address="0x00009888" value="0x0AEAC000" />
+        <register type="NOA" address="0x00009888" value="0x0CEAC000" />
+        <register type="NOA" address="0x00009888" value="0x0AEC8000" />
+        <register type="NOA" address="0x00009888" value="0x0CEC8000" />
+        <register type="NOA" address="0x00009888" value="0x0EEC8000" />
+        <register type="NOA" address="0x00009888" value="0x18EC0002" />
+        <register type="NOA" address="0x00009888" value="0x04EEC700" />
+        <register type="NOA" address="0x00009888" value="0x06EE00CF" />
+        <register type="NOA" address="0x00009888" value="0x10EE0000" />
+        <register type="NOA" address="0x00009888" value="0x04EF8000" />
+        <register type="NOA" address="0x00009888" value="0x06EF4000" />
+        <register type="NOA" address="0x00009888" value="0x1CF00014" />
+        <register type="NOA" address="0x00009888" value="0x0C045400" />
+        <register type="NOA" address="0x00009888" value="0x0E045555" />
+        <register type="NOA" address="0x00009888" value="0x10040155" />
+        <register type="NOA" address="0x00009888" value="0x04055000" />
+        <register type="NOA" address="0x00009888" value="0x0A055000" />
+        <register type="NOA" address="0x00009888" value="0x0C055000" />
+        <register type="NOA" address="0x00009888" value="0x0E055000" />
+        <register type="NOA" address="0x00009888" value="0x14050055" />
+        <register type="NOA" address="0x00009888" value="0x06055000" />
+        <register type="NOA" address="0x00009888" value="0x08055000" />
+        <register type="NOA" address="0x00009888" value="0x2406FF00" />
+        <register type="NOA" address="0x00009888" value="0x260600FF" />
+        <register type="NOA" address="0x00009888" value="0x0A08A000" />
+        <register type="NOA" address="0x00009888" value="0x0C08A000" />
+        <register type="NOA" address="0x00009888" value="0x0E095000" />
+        <register type="NOA" address="0x00009888" value="0x14090005" />
+        <register type="NOA" address="0x00009888" value="0x020D8000" />
+        <register type="NOA" address="0x00009888" value="0x040DA000" />
+        <register type="NOA" address="0x00009888" value="0x060D2000" />
+        <register type="NOA" address="0x00009888" value="0x060E4000" />
+        <register type="NOA" address="0x00009888" value="0x080E5000" />
+        <register type="NOA" address="0x00009888" value="0x0A0E1000" />
+        <register type="NOA" address="0x00009888" value="0x1812A800" />
+        <register type="NOA" address="0x00009888" value="0x1A12003E" />
+        <register type="NOA" address="0x00009888" value="0x0212C000" />
+        <register type="NOA" address="0x00009888" value="0x0412C000" />
+        <register type="NOA" address="0x00009888" value="0x0813C000" />
+        <register type="NOA" address="0x00009888" value="0x0A13F000" />
+        <register type="NOA" address="0x00009888" value="0x04136000" />
+        <register type="NOA" address="0x00009888" value="0x0A14C000" />
+        <register type="NOA" address="0x00009888" value="0x0C14C000" />
+        <register type="NOA" address="0x00009888" value="0x0E14C000" />
+        <register type="NOA" address="0x00009888" value="0x00148000" />
+        <register type="NOA" address="0x00009888" value="0x02144000" />
+        <register type="NOA" address="0x00009888" value="0x0015C000" />
+        <register type="NOA" address="0x00009888" value="0x0E15C000" />
+        <register type="NOA" address="0x00009888" value="0x16152AF8" />
+        <register type="NOA" address="0x00009888" value="0x18150005" />
+        <register type="NOA" address="0x00009888" value="0x02154000" />
+        <register type="NOA" address="0x00009888" value="0x04154000" />
+        <register type="NOA" address="0x00009888" value="0x06158000" />
+        <register type="NOA" address="0x00009888" value="0x08158000" />
+        <register type="NOA" address="0x00009888" value="0x0A158000" />
+        <register type="NOA" address="0x00009888" value="0x0C158000" />
+        <register type="NOA" address="0x00009888" value="0x00182000" />
+        <register type="NOA" address="0x00009888" value="0x06188000" />
+        <register type="NOA" address="0x00009888" value="0x0818A000" />
+        <register type="NOA" address="0x00009888" value="0x08192000" />
+        <register type="NOA" address="0x00009888" value="0x0E198000" />
+        <register type="NOA" address="0x00009888" value="0x12190140" />
+        <register type="NOA" address="0x00009888" value="0x0E1CA000" />
+        <register type="NOA" address="0x00009888" value="0x001C8000" />
+        <register type="NOA" address="0x00009888" value="0x021C2000" />
+        <register type="NOA" address="0x00009888" value="0x141D0028" />
+        <register type="NOA" address="0x00009888" value="0x081D8000" />
+        <register type="NOA" address="0x00009888" value="0x0A1D2000" />
+        <register type="NOA" address="0x00009884" value="0x00000003" />
+        <register type="NOA" address="0x00009888" value="0x301F8000" />
+        <register type="NOA" address="0x00009888" value="0x501F4924" />
+        <register type="NOA" address="0x00009888" value="0x521F4924" />
+        <register type="NOA" address="0x00009888" value="0x541F0024" />
+        <register type="NOA" address="0x00009888" value="0x3A1F8000" />
+        <register type="NOA" address="0x00009888" value="0x4E1F2420" />
+        <register type="NOA" address="0x00009888" value="0x3E1F5000" />
+        <register type="NOA" address="0x00009888" value="0x461F3050" />
+        <register type="NOA" address="0x00009888" value="0x481F2030" />
+        <register type="NOA" address="0x00009888" value="0x4A1F0020" />
+        <register type="NOA" address="0x00009888" value="0x4C1F2000" />
+        <register type="NOA" address="0x00009888" value="0x181F0000" />
+        <register type="NOA" address="0x00009888" value="0x401F0000" />
+        <register type="NOA" address="0x00009888" value="0x421F5050" />
+        <register type="NOA" address="0x00009888" value="0x441F3030" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x00800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+    </register_config>
+  </set>
+
+  <set name="Gpu Rings Busyness"
+       mdapi_supported_apis="VK OGL OCL MEDIA IO BB"
+       underscore_name="gpu_busyness"
+       hw_config_guid="40dc79f2-88c8-47c6-8f86-f509e39fbe5d"
+       chipset="ICL"
+       symbol_name="GpuBusyness"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="Vebox Ring Busy"
+             description="The percentage of time when vebox command streamer was busy."
+             data_type="float"
+             max_equation="100"
+             equation="C 4 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vebox_busy"
+             units="percent"
+             symbol_name="VeboxBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="System Frame Batch"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Render Ring Busy"
+             description="The percentage of time when render command streamer was busy."
+             data_type="float"
+             max_equation="100"
+             equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="render_busy"
+             units="percent"
+             symbol_name="RenderBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="System Frame Batch"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Vdbox0 Ring Busy"
+             description="The percentage of time when Vdbox0 command streamer was busy."
+             data_type="float"
+             max_equation="100"
+             equation="C 6 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vdbox0_busy"
+             units="percent"
+             symbol_name="Vdbox0Busy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="System Frame Batch"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Posh Ring Busy"
+             description="The percentage of time when posh command streamer was busy."
+             data_type="float"
+             max_equation="100"
+             equation="C 2 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="posh_engine_busy"
+             units="percent"
+             symbol_name="PoshEngineBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="System Frame Batch"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Blitter Ring Busy"
+             description="The percentage of time when blitter command streamer was busy."
+             data_type="float"
+             max_equation="100"
+             equation="C 3 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="blitter_busy"
+             units="percent"
+             symbol_name="BlitterBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="System Frame Batch"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Vdbox1 Ring Busy"
+             description="The percentage of time when Vdbox1 command streamer was busy."
+             data_type="float"
+             max_equation="100"
+             equation="C 5 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vdbox1_busy"
+             units="percent"
+             symbol_name="Vdbox1Busy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="System Frame Batch"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="AnyRingBusy"
+             description="The percentage of time when any command streamer was busy."
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="any_ring_busy"
+             units="percent"
+             symbol_name="AnyRingBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00000D04" value="0x00000200" />
+        <register type="NOA" address="0x00009840" value="0x00000000" />
+        <register type="NOA" address="0x00009884" value="0x00000003" />
+        <register type="NOA" address="0x00009888" value="0x0E061200" />
+        <register type="NOA" address="0x00009888" value="0x22062400" />
+        <register type="NOA" address="0x00009888" value="0x10002400" />
+        <register type="NOA" address="0x00009888" value="0x00038000" />
+        <register type="NOA" address="0x00009888" value="0x06032000" />
+        <register type="NOA" address="0x00009888" value="0x020600F3" />
+        <register type="NOA" address="0x00009888" value="0x0C060043" />
+        <register type="NOA" address="0x00009888" value="0x20060000" />
+        <register type="NOA" address="0x00009888" value="0x02000023" />
+        <register type="NOA" address="0x00009888" value="0x20002000" />
+        <register type="NOA" address="0x00009888" value="0x081A8000" />
+        <register type="NOA" address="0x00009888" value="0x3A1F6000" />
+        <register type="NOA" address="0x00009888" value="0x4E1F2900" />
+        <register type="NOA" address="0x00009888" value="0x501F00E9" />
+        <register type="NOA" address="0x00009888" value="0x10204000" />
+        <register type="NOA" address="0x00009888" value="0x0C214000" />
+        <register type="NOA" address="0x00009888" value="0x181F0000" />
+        <register type="NOA" address="0x00009888" value="0x401F4131" />
+        <register type="NOA" address="0x00009888" value="0x421F1021" />
+        <register type="NOA" address="0x00009888" value="0x441F3100" />
+        <register type="NOA" address="0x00009888" value="0x301F0000" />
+        <register type="NOA" address="0x00009884" value="0x00000002" />
+        <register type="NOA" address="0x00009888" value="0x181B2400" />
+        <register type="NOA" address="0x00009888" value="0x185B2400" />
+        <register type="NOA" address="0x00009888" value="0x12240120" />
+        <register type="NOA" address="0x00009888" value="0x06218000" />
+        <register type="NOA" address="0x00009888" value="0x08212000" />
+        <register type="NOA" address="0x00009888" value="0x0A0A8000" />
+        <register type="NOA" address="0x00009888" value="0x180B8000" />
+        <register type="NOA" address="0x00009888" value="0x0A0C8000" />
+        <register type="NOA" address="0x00009888" value="0x040F8000" />
+        <register type="NOA" address="0x00009888" value="0x0E080010" />
+        <register type="NOA" address="0x00009888" value="0x041B8300" />
+        <register type="NOA" address="0x00009888" value="0x101B0000" />
+        <register type="NOA" address="0x00009888" value="0x221B0000" />
+        <register type="NOA" address="0x00009888" value="0x041E4000" />
+        <register type="NOA" address="0x00009888" value="0x084A8000" />
+        <register type="NOA" address="0x00009888" value="0x184B4000" />
+        <register type="NOA" address="0x00009888" value="0x084C8000" />
+        <register type="NOA" address="0x00009888" value="0x044F2000" />
+        <register type="NOA" address="0x00009888" value="0x0E480004" />
+        <register type="NOA" address="0x00009888" value="0x045B0083" />
+        <register type="NOA" address="0x00009888" value="0x105B0000" />
+        <register type="NOA" address="0x00009888" value="0x225B0000" />
+        <register type="NOA" address="0x00009888" value="0x045E1000" />
+        <register type="NOA" address="0x00009888" value="0x0823A000" />
+        <register type="NOA" address="0x00009888" value="0x02242980" />
+        <register type="NOA" address="0x00009888" value="0x10240000" />
+        <register type="NOA" address="0x00009888" value="0x06240000" />
+        <register type="NOA" address="0x00009888" value="0x0A244000" />
+        <register type="NOA" address="0x00009888" value="0x1C250004" />
+        <register type="NOA" address="0x00009888" value="0x08268000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x10800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+        <register type="OA" address="0x00002770" value="0x0007C000" />
+        <register type="OA" address="0x00002774" value="0x000007FF" />
+    </register_config>
+  </set>
+
+  <set name="Metric set TestOa"
+       mdapi_supported_apis="VK OGL OCL IO BB"
+       underscore_name="test_oa"
+       hw_config_guid="3c0bf614-5d67-4326-887f-a24eb8a58244"
+       chipset="ICL"
+       symbol_name="TestOa"
+       >
+    <counter name="TestCounter7"
+             description="HW test counter 7. Factor: 0.6666"
+             data_type="uint64"
+             equation="B 7 READ"
+             underscore_name="counter7"
+             units="events"
+             symbol_name="Counter7"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="TestCounter8"
+             description="HW test counter 8. Should be equal to 1."
+             data_type="uint64"
+             equation="C 0 READ"
+             underscore_name="counter8"
+             units="events"
+             symbol_name="Counter8"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="TestCounter4"
+             description="HW test counter 4. Factor: 0.3333"
+             data_type="uint64"
+             equation="B 4 READ"
+             underscore_name="counter4"
+             units="events"
+             symbol_name="Counter4"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="TestCounter5"
+             description="HW test counter 5. Factor: 0.3333"
+             data_type="uint64"
+             equation="B 5 READ"
+             underscore_name="counter5"
+             units="events"
+             symbol_name="Counter5"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="TestCounter6"
+             description="HW test counter 6. Factor: 0.16666"
+             data_type="uint64"
+             equation="B 6 READ"
+             underscore_name="counter6"
+             units="events"
+             symbol_name="Counter6"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="TestCounter3"
+             description="HW test counter 3. Factor: 0.5"
+             data_type="uint64"
+             equation="B 3 READ"
+             underscore_name="counter3"
+             units="events"
+             symbol_name="Counter3"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="TestCounter0"
+             description="HW test counter 0. Factor: 0.0"
+             data_type="uint64"
+             equation="B 0 READ"
+             underscore_name="counter0"
+             units="events"
+             symbol_name="Counter0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="TestCounter1"
+             description="HW test counter 1. Factor: 1.0"
+             data_type="uint64"
+             equation="B 1 READ"
+             underscore_name="counter1"
+             units="events"
+             symbol_name="Counter1"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="TestCounter2"
+             description="HW test counter 2. Factor: 1.0"
+             data_type="uint64"
+             equation="B 2 READ"
+             underscore_name="counter2"
+             units="events"
+             symbol_name="Counter2"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00000D04" value="0x00000200" />
+        <register type="NOA" address="0x00009840" value="0x00000000" />
+        <register type="NOA" address="0x00009884" value="0x00000003" />
+        <register type="NOA" address="0x00009888" value="0x16130000" />
+        <register type="NOA" address="0x00009888" value="0x24000001" />
+        <register type="NOA" address="0x00009888" value="0x0E130056" />
+        <register type="NOA" address="0x00009888" value="0x10130000" />
+        <register type="NOA" address="0x00009888" value="0x1A130000" />
+        <register type="NOA" address="0x00009888" value="0x541F0001" />
+        <register type="NOA" address="0x00009888" value="0x181F0000" />
+        <register type="NOA" address="0x00009888" value="0x4C1F0000" />
+        <register type="NOA" address="0x00009888" value="0x301F0000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0xF0800000" />
+        <register type="OA" address="0x00002770" value="0x00000004" />
+        <register type="OA" address="0x00002774" value="0x0000FFFF" />
+        <register type="OA" address="0x00002778" value="0x00000003" />
+        <register type="OA" address="0x0000277C" value="0x0000FFFF" />
+        <register type="OA" address="0x00002780" value="0x00000007" />
+        <register type="OA" address="0x00002784" value="0x0000FFFF" />
+        <register type="OA" address="0x00002788" value="0x00100002" />
+        <register type="OA" address="0x0000278C" value="0x0000FFF7" />
+        <register type="OA" address="0x00002790" value="0x00100002" />
+        <register type="OA" address="0x00002794" value="0x0000FFCF" />
+        <register type="OA" address="0x00002798" value="0x00100082" />
+        <register type="OA" address="0x0000279C" value="0x0000FFEF" />
+        <register type="OA" address="0x000027A0" value="0x001000C2" />
+        <register type="OA" address="0x000027A4" value="0x0000FFE7" />
+        <register type="OA" address="0x000027A8" value="0x00100001" />
+        <register type="OA" address="0x000027AC" value="0x0000FFE7" />
+    </register_config>
+  </set>
+
+</metrics>
diff --git a/lib/i915/perf-configs/oa-kblgt2.xml b/lib/i915/perf-configs/oa-kblgt2.xml
new file mode 100644
index 00000000..4f667e48
--- /dev/null
+++ b/lib/i915/perf-configs/oa-kblgt2.xml
@@ -0,0 +1,10866 @@
+<?xml version="1.0"?>
+<metrics version="1581935519" merge_md5="">
+  <set name="Render Metrics Basic Gen9"
+       mdapi_supported_apis="VK OGL OCL IO BB"
+       underscore_name="render_basic"
+       hw_config_guid="99c1a40e-a090-4354-86e3-4d068bb1917e"
+       chipset="KBLGT2"
+       symbol_name="RenderBasic"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Misses"
+             description="The total number of L3 misses."
+             data_type="uint64"
+             equation="C 4 READ"
+             underscore_name="l3_misses"
+             units="messages"
+             symbol_name="L3Misses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/TAG"
+             />
+    <counter name="GTI L3 Throughput"
+             description="The total number of GPU memory bytes transferred between L3 caches and GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="$L3Misses 64 UMUL"
+             underscore_name="gti_l3_throughput"
+             units="bytes"
+             symbol_name="GtiL3Throughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Cache Misses"
+             description="The total number of sampler cache misses in all LODs in all sampler units."
+             data_type="uint64"
+             equation="B 4 READ 8 UMUL"
+             underscore_name="sampler_l1_misses"
+             units="messages"
+             symbol_name="SamplerL1Misses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler 1 Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which Sampler 1 has been slowing down the pipe when processing EU requests."
+             data_type="float"
+             high_watermark="15"
+             equation="B 3 READ 100 UMUL $GpuCoreClocks FDIV"
+             max_equation="100"
+             underscore_name="sampler1_bottleneck"
+             units="percent"
+             symbol_name="Sampler1Bottleneck"
+             availability="$SubsliceMask 0x12 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="L3 Sampler Throughput"
+             description="The total number of GPU memory bytes transferred between samplers and L3 caches."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="$SamplerL1Misses 64 UMUL"
+             underscore_name="l3_sampler_throughput"
+             units="bytes"
+             symbol_name="L3SamplerThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Sampler"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on the both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Sampler 0 Busy"
+             description="The percentage of time in which Sampler 0 has been processing EU requests."
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler0_busy"
+             units="percent"
+             symbol_name="Sampler0Busy"
+             availability="$SubsliceMask 0x09 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_group="Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Sampler 1 Busy"
+             description="The percentage of time in which Sampler 1 has been processing EU requests."
+             data_type="float"
+             max_equation="100"
+             equation="B 1 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler1_busy"
+             units="percent"
+             symbol_name="Sampler1Busy"
+             availability="$SubsliceMask 0x12 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_group="Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Samplers Busy"
+             description="The percentage of time in which samplers have been processing EU requests."
+             data_type="float"
+             max_equation="100"
+             equation="$Sampler0Busy $Sampler1Busy FMAX"
+             underscore_name="samplers_busy"
+             units="percent"
+             symbol_name="SamplersBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="Sampler"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="GTI Fixed Pipe Throughput"
+             description="The total number of GPU memory bytes transferred between 3D Pipeline (Command Dispatch, Input Assembly and Stream Output) and GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL"
+             equation="B 6 READ B 7 READ UADD 64 UMUL"
+             underscore_name="gti_vf_throughput"
+             units="bytes"
+             symbol_name="GtiVfThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="GTI/3D Pipe"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler 0 Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which Sampler 0 has been slowing down the pipe when processing EU requests."
+             data_type="float"
+             high_watermark="15"
+             equation="B 2 READ 100 UMUL $GpuCoreClocks FDIV"
+             max_equation="100"
+             underscore_name="sampler0_bottleneck"
+             units="percent"
+             symbol_name="Sampler0Bottleneck"
+             availability="$SubsliceMask 0x09 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="L3 Lookup Accesses w/o IC"
+             description="The total number of L3 cache lookup accesses w/o IC."
+             data_type="uint64"
+             equation="$SamplerL1Misses $ShaderMemoryAccesses UADD"
+             underscore_name="l3_lookups"
+             units="messages"
+             symbol_name="L3Lookups"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/TAG"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GTI Read Throughput"
+             description="The total number of GPU memory bytes read from GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL"
+             equation="C 6 READ 64 UMUL"
+             underscore_name="gti_read_throughput"
+             units="bytes"
+             symbol_name="GtiReadThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GTI Depth Throughput"
+             description="The total number of GPU memory bytes transferred between depth caches and GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="C 0 READ C 1 READ UADD 64 UMUL"
+             underscore_name="gti_depth_throughput"
+             units="bytes"
+             symbol_name="GtiDepthThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="GTI/Depth Cache"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Samplers Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which samplers have been slowing down the pipe when processing EU requests."
+             data_type="float"
+             high_watermark="15"
+             equation="$Sampler0Bottleneck $Sampler1Bottleneck FMAX"
+             max_equation="100"
+             underscore_name="sampler_bottleneck"
+             units="percent"
+             symbol_name="SamplerBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Indicate System Frame Batch Draw"
+             mdapi_group="Sampler"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="GTI HDC TLB Lookup Throughput"
+             description="The total number of GPU memory bytes transferred between GTI and HDC, when HDC is doing TLB lookups."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="C 5 READ 64 UMUL"
+             underscore_name="gti_hdc_lookups_throughput"
+             units="bytes"
+             symbol_name="GtiHdcLookupsThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GTI RCC Throughput"
+             description="The total number of GPU memory bytes transferred between render color caches and GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="C 2 READ C 3 READ UADD 64 UMUL"
+             underscore_name="gti_rcc_throughput"
+             units="bytes"
+             symbol_name="GtiRccThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="GTI/Color Cache"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="GTI Write Throughput"
+             description="The total number of GPU memory bytes written to GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 32 UMUL"
+             equation="C 7 READ 64 UMUL"
+             underscore_name="gti_write_throughput"
+             units="bytes"
+             symbol_name="GtiWriteThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x166C01E0" />
+        <register type="NOA" address="0x00009888" value="0x12170280" />
+        <register type="NOA" address="0x00009888" value="0x12370280" />
+        <register type="NOA" address="0x00009888" value="0x11930317" />
+        <register type="NOA" address="0x00009888" value="0x159303DF" />
+        <register type="NOA" address="0x00009888" value="0x3F900003" />
+        <register type="NOA" address="0x00009888" value="0x1A4E0080" />
+        <register type="NOA" address="0x00009888" value="0x0A6C0053" />
+        <register type="NOA" address="0x00009888" value="0x106C0000" />
+        <register type="NOA" address="0x00009888" value="0x1C6C0000" />
+        <register type="NOA" address="0x00009888" value="0x0A1B4000" />
+        <register type="NOA" address="0x00009888" value="0x1C1C0001" />
+        <register type="NOA" address="0x00009888" value="0x002F1000" />
+        <register type="NOA" address="0x00009888" value="0x042F1000" />
+        <register type="NOA" address="0x00009888" value="0x004C4000" />
+        <register type="NOA" address="0x00009888" value="0x0A4C8400" />
+        <register type="NOA" address="0x00009888" value="0x000D2000" />
+        <register type="NOA" address="0x00009888" value="0x060D8000" />
+        <register type="NOA" address="0x00009888" value="0x080DA000" />
+        <register type="NOA" address="0x00009888" value="0x0A0D2000" />
+        <register type="NOA" address="0x00009888" value="0x0C0F0400" />
+        <register type="NOA" address="0x00009888" value="0x0E0F6600" />
+        <register type="NOA" address="0x00009888" value="0x002C8000" />
+        <register type="NOA" address="0x00009888" value="0x162C2200" />
+        <register type="NOA" address="0x00009888" value="0x062D8000" />
+        <register type="NOA" address="0x00009888" value="0x082D8000" />
+        <register type="NOA" address="0x00009888" value="0x00133000" />
+        <register type="NOA" address="0x00009888" value="0x08133000" />
+        <register type="NOA" address="0x00009888" value="0x00170020" />
+        <register type="NOA" address="0x00009888" value="0x08170021" />
+        <register type="NOA" address="0x00009888" value="0x10170000" />
+        <register type="NOA" address="0x00009888" value="0x0633C000" />
+        <register type="NOA" address="0x00009888" value="0x0833C000" />
+        <register type="NOA" address="0x00009888" value="0x06370800" />
+        <register type="NOA" address="0x00009888" value="0x08370840" />
+        <register type="NOA" address="0x00009888" value="0x10370000" />
+        <register type="NOA" address="0x00009888" value="0x0D933031" />
+        <register type="NOA" address="0x00009888" value="0x0F933E3F" />
+        <register type="NOA" address="0x00009888" value="0x01933D00" />
+        <register type="NOA" address="0x00009888" value="0x0393073C" />
+        <register type="NOA" address="0x00009888" value="0x0593000E" />
+        <register type="NOA" address="0x00009888" value="0x1D930000" />
+        <register type="NOA" address="0x00009888" value="0x19930000" />
+        <register type="NOA" address="0x00009888" value="0x1B930000" />
+        <register type="NOA" address="0x00009888" value="0x1D900157" />
+        <register type="NOA" address="0x00009888" value="0x1F900158" />
+        <register type="NOA" address="0x00009888" value="0x35900000" />
+        <register type="NOA" address="0x00009888" value="0x2B908000" />
+        <register type="NOA" address="0x00009888" value="0x2D908000" />
+        <register type="NOA" address="0x00009888" value="0x2F908000" />
+        <register type="NOA" address="0x00009888" value="0x31908000" />
+        <register type="NOA" address="0x00009888" value="0x15908000" />
+        <register type="NOA" address="0x00009888" value="0x17908000" />
+        <register type="NOA" address="0x00009888" value="0x19908000" />
+        <register type="NOA" address="0x00009888" value="0x1B908000" />
+        <register type="NOA" address="0x00009888" value="0x1190001F" />
+        <register type="NOA" address="0x00009888" value="0x51904400" />
+        <register type="NOA" address="0x00009888" value="0x41900020" />
+        <register type="NOA" address="0x00009888" value="0x55900000" />
+        <register type="NOA" address="0x00009888" value="0x45900C21" />
+        <register type="NOA" address="0x00009888" value="0x47900061" />
+        <register type="NOA" address="0x00009888" value="0x57904440" />
+        <register type="NOA" address="0x00009888" value="0x49900000" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+        <register type="NOA" address="0x00009888" value="0x4B900000" />
+        <register type="NOA" address="0x00009888" value="0x59900004" />
+        <register type="NOA" address="0x00009888" value="0x43900000" />
+        <register type="NOA" address="0x00009888" value="0x53904444" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x00800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+        <register type="OA" address="0x00002740" value="0x00000000" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E758" value="0x00015014" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+        <register type="FLEX" address="0x0000E65C" value="0x00222222" />
+    </register_config>
+  </set>
+
+  <set name="Compute Metrics Basic Gen9"
+       mdapi_supported_apis="VK OGL4 OCL IO BB"
+       underscore_name="compute_basic"
+       hw_config_guid="12994724-3a5a-4303-bb3c-ba0175d2c200"
+       chipset="KBLGT2"
+       symbol_name="ComputeBasic"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Untyped Bytes Read"
+             description="The total number of untyped memory bytes read via Data Port."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="B 6 READ B 7 READ C 0 READ UADD UADD $EuSlicesTotalCount 64 UMUL UMUL"
+             underscore_name="untyped_bytes_read"
+             units="bytes"
+             symbol_name="UntypedBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Typed Bytes Written"
+             description="The total number of typed memory bytes written via Data Port."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="B 3 READ B 4 READ B 5 READ UADD UADD $EuSlicesTotalCount 64 UMUL UMUL"
+             underscore_name="typed_bytes_written"
+             units="bytes"
+             symbol_name="TypedBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="fpu0_active"
+             units="percent"
+             symbol_name="Fpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="fpu1_active"
+             units="percent"
+             symbol_name="Fpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU AVG IPC Rate"
+             description="The average rate of IPC calculated for 2 FPU pipelines."
+             data_type="float"
+             max_equation="2"
+             equation="A 9 READ  A 10 READ  A 11 READ UADD  A 9 READ USUB FDIV 1 FADD"
+             underscore_name="eu_avg_ipc_rate"
+             units="number"
+             symbol_name="EuAvgIpcRate"
+             semantic_type="ratio"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier4 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texel lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GTI Read Throughput"
+             description="The total number of GPU memory bytes read from GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="C 4 READ 64 UMUL"
+             underscore_name="gti_read_throughput"
+             units="bytes"
+             symbol_name="GtiReadThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Untyped Writes"
+             description="The total number of untyped memory bytes written via Data Port."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="C 1 READ C 2 READ C 3 READ UADD UADD $EuSlicesTotalCount 64 UMUL UMUL"
+             underscore_name="untyped_bytes_written"
+             units="bytes"
+             symbol_name="UntypedBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="Typed Bytes Read"
+             description="The total number of typed memory bytes read via Data Port."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="B 0 READ B 1 READ B 2 READ UADD UADD $EuSlicesTotalCount 64 UMUL UMUL"
+             underscore_name="typed_bytes_read"
+             units="bytes"
+             symbol_name="TypedBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="EU Thread Occupancy"
+             description="The percentage of time in which hardware threads occupied EUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 13 READ 8 UMUL $EuCoresTotalCount UDIV $EuThreadsCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_thread_occupancy"
+             units="percent"
+             symbol_name="EuThreadOccupancy"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="GTI Write Throughput"
+             description="The total number of GPU memory bytes written to GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 32 UMUL"
+             equation="C 5 READ 64 UMUL"
+             underscore_name="gti_write_throughput"
+             units="bytes"
+             symbol_name="GtiWriteThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <counter name="EU Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_send_active"
+             units="percent"
+             symbol_name="EuSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x104F00E0" />
+        <register type="NOA" address="0x00009888" value="0x124F1C00" />
+        <register type="NOA" address="0x00009888" value="0x106C00E0" />
+        <register type="NOA" address="0x00009888" value="0x37906800" />
+        <register type="NOA" address="0x00009888" value="0x3F900003" />
+        <register type="NOA" address="0x00009888" value="0x004E8000" />
+        <register type="NOA" address="0x00009888" value="0x1A4E0820" />
+        <register type="NOA" address="0x00009888" value="0x1C4E0002" />
+        <register type="NOA" address="0x00009888" value="0x064F0900" />
+        <register type="NOA" address="0x00009888" value="0x084F0032" />
+        <register type="NOA" address="0x00009888" value="0x0A4F1891" />
+        <register type="NOA" address="0x00009888" value="0x0C4F0E00" />
+        <register type="NOA" address="0x00009888" value="0x0E4F003C" />
+        <register type="NOA" address="0x00009888" value="0x004F0D80" />
+        <register type="NOA" address="0x00009888" value="0x024F003B" />
+        <register type="NOA" address="0x00009888" value="0x006C0002" />
+        <register type="NOA" address="0x00009888" value="0x086C0100" />
+        <register type="NOA" address="0x00009888" value="0x0C6C000C" />
+        <register type="NOA" address="0x00009888" value="0x0E6C0B00" />
+        <register type="NOA" address="0x00009888" value="0x186C0000" />
+        <register type="NOA" address="0x00009888" value="0x1C6C0000" />
+        <register type="NOA" address="0x00009888" value="0x1E6C0000" />
+        <register type="NOA" address="0x00009888" value="0x001B4000" />
+        <register type="NOA" address="0x00009888" value="0x081B8000" />
+        <register type="NOA" address="0x00009888" value="0x0C1B4000" />
+        <register type="NOA" address="0x00009888" value="0x0E1B8000" />
+        <register type="NOA" address="0x00009888" value="0x101C8000" />
+        <register type="NOA" address="0x00009888" value="0x1A1C8000" />
+        <register type="NOA" address="0x00009888" value="0x1C1C0024" />
+        <register type="NOA" address="0x00009888" value="0x065B8000" />
+        <register type="NOA" address="0x00009888" value="0x085B4000" />
+        <register type="NOA" address="0x00009888" value="0x0A5BC000" />
+        <register type="NOA" address="0x00009888" value="0x0C5B8000" />
+        <register type="NOA" address="0x00009888" value="0x0E5B4000" />
+        <register type="NOA" address="0x00009888" value="0x005B8000" />
+        <register type="NOA" address="0x00009888" value="0x025B4000" />
+        <register type="NOA" address="0x00009888" value="0x1A5C6000" />
+        <register type="NOA" address="0x00009888" value="0x1C5C001B" />
+        <register type="NOA" address="0x00009888" value="0x125C8000" />
+        <register type="NOA" address="0x00009888" value="0x145C8000" />
+        <register type="NOA" address="0x00009888" value="0x004C8000" />
+        <register type="NOA" address="0x00009888" value="0x0A4C2000" />
+        <register type="NOA" address="0x00009888" value="0x0C4C0208" />
+        <register type="NOA" address="0x00009888" value="0x000DA000" />
+        <register type="NOA" address="0x00009888" value="0x060D8000" />
+        <register type="NOA" address="0x00009888" value="0x080DA000" />
+        <register type="NOA" address="0x00009888" value="0x0A0DA000" />
+        <register type="NOA" address="0x00009888" value="0x0C0DA000" />
+        <register type="NOA" address="0x00009888" value="0x0E0DA000" />
+        <register type="NOA" address="0x00009888" value="0x020D2000" />
+        <register type="NOA" address="0x00009888" value="0x0C0F5400" />
+        <register type="NOA" address="0x00009888" value="0x0E0F5500" />
+        <register type="NOA" address="0x00009888" value="0x100F0155" />
+        <register type="NOA" address="0x00009888" value="0x002C8000" />
+        <register type="NOA" address="0x00009888" value="0x0E2CC000" />
+        <register type="NOA" address="0x00009888" value="0x162CFB00" />
+        <register type="NOA" address="0x00009888" value="0x182C00BE" />
+        <register type="NOA" address="0x00009888" value="0x022CC000" />
+        <register type="NOA" address="0x00009888" value="0x042CC000" />
+        <register type="NOA" address="0x00009888" value="0x19900157" />
+        <register type="NOA" address="0x00009888" value="0x1B900158" />
+        <register type="NOA" address="0x00009888" value="0x1D900105" />
+        <register type="NOA" address="0x00009888" value="0x1F900103" />
+        <register type="NOA" address="0x00009888" value="0x35900000" />
+        <register type="NOA" address="0x00009888" value="0x11900FFF" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x41900800" />
+        <register type="NOA" address="0x00009888" value="0x55900000" />
+        <register type="NOA" address="0x00009888" value="0x45900821" />
+        <register type="NOA" address="0x00009888" value="0x47900802" />
+        <register type="NOA" address="0x00009888" value="0x57900000" />
+        <register type="NOA" address="0x00009888" value="0x49900802" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+        <register type="NOA" address="0x00009888" value="0x4B900002" />
+        <register type="NOA" address="0x00009888" value="0x59900000" />
+        <register type="NOA" address="0x00009888" value="0x43900422" />
+        <register type="NOA" address="0x00009888" value="0x53904444" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x00800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+        <register type="OA" address="0x00002740" value="0x00000000" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00000003" />
+        <register type="FLEX" address="0x0000E658" value="0x00002001" />
+        <register type="FLEX" address="0x0000E758" value="0x00778008" />
+        <register type="FLEX" address="0x0000E45C" value="0x00088078" />
+        <register type="FLEX" address="0x0000E55C" value="0x00808708" />
+        <register type="FLEX" address="0x0000E65C" value="0x00222222" />
+    </register_config>
+  </set>
+
+  <set name="Render Metrics for 3D Pipeline Profile Gen9"
+       mdapi_supported_apis="VK OGL OCL IO BB"
+       underscore_name="render_pipe_profile"
+       hw_config_guid="d7a17a3a-ca71-40d2-a919-ace80d50633f"
+       chipset="KBLGT2"
+       symbol_name="RenderPipeProfile"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Bottleneck"
+             low_watermark="10"
+             description="The percentage of time in which vertex shader pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="30"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_bottleneck"
+             units="percent"
+             symbol_name="VsBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Hi-Depth Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which early hierarchical depth test pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="15"
+             equation="C 6 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="hi_depth_bottleneck"
+             units="percent"
+             symbol_name="HiDepthBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which geometry shader pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="15"
+             equation="B 3 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gs_bottleneck"
+             units="percent"
+             symbol_name="GsBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Geometry Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="BC Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which barycentric coordinates calculation pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="15"
+             equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="bc_bottleneck"
+             units="percent"
+             symbol_name="BcBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Rasterizer/Barycentric Calc"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="HS Stall"
+             description="The percentage of time in which hull shader pipeline stage was stalled."
+             data_type="float"
+             equation="C 1 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="hs_stall"
+             units="percent"
+             symbol_name="HsStall"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier4 Correlate Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Hull Shader"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texel lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="VF Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which vertex fetch pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="15"
+             equation="C 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vf_bottleneck"
+             units="percent"
+             symbol_name="VfBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Input Assembler"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Strip-Fans Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which strip-fans pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="10"
+             equation="B 6 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sf_bottleneck"
+             units="percent"
+             symbol_name="SfBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Rasterizer/Strip-Fans"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SF Stall"
+             description="The percentage of time in which strip-fans pipeline stage was stalled."
+             data_type="float"
+             equation="C 5 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sf_stall"
+             units="percent"
+             symbol_name="SfStall"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Correlate Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Strip-Fans"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="HS Bottleneck"
+             low_watermark="3"
+             description="The percentage of time in which hull shader pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="9"
+             equation="B 1 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="hs_bottleneck"
+             units="percent"
+             symbol_name="HsBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Hull Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="CL Stall"
+             description="The percentage of time in which clipper pipeline stage was stalled."
+             data_type="float"
+             equation="C 4 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="cl_stall"
+             units="percent"
+             symbol_name="ClStall"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Correlate Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Clipper"
+             />
+    <counter name="SO Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which stream output pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="15"
+             equation="B 4 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="so_bottleneck"
+             units="percent"
+             symbol_name="SoBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Stream Output"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="DS Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which domain shader pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="15"
+             equation="B 2 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ds_bottleneck"
+             units="percent"
+             symbol_name="DsBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Domain Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Clipper Bottleneck"
+             low_watermark="10"
+             description="The percentage of time in which clipper pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="30"
+             equation="B 5 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="cl_bottleneck"
+             units="percent"
+             symbol_name="ClBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Clipper"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Stall"
+             description="The percentage of time in which domain shader pipeline stage was stalled."
+             data_type="float"
+             equation="C 2 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ds_stall"
+             units="percent"
+             symbol_name="DsStall"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier4 Correlate Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Domain Shader"
+             />
+    <counter name="Early Depth Bottleneck"
+             low_watermark="10"
+             description="The percentage of time in which early depth test pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="30"
+             equation="B 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="early_depth_bottleneck"
+             units="percent"
+             symbol_name="EarlyDepthBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="SO Stall"
+             description="The percentage of time in which stream-output pipeline stage was stalled."
+             data_type="float"
+             equation="C 3 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="so_stall"
+             units="percent"
+             symbol_name="SoStall"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Correlate Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Stream Output"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x0C0E001F" />
+        <register type="NOA" address="0x00009888" value="0x0A0F0000" />
+        <register type="NOA" address="0x00009888" value="0x10116800" />
+        <register type="NOA" address="0x00009888" value="0x178A03E0" />
+        <register type="NOA" address="0x00009888" value="0x11824C00" />
+        <register type="NOA" address="0x00009888" value="0x11830020" />
+        <register type="NOA" address="0x00009888" value="0x13840020" />
+        <register type="NOA" address="0x00009888" value="0x11850019" />
+        <register type="NOA" address="0x00009888" value="0x11860007" />
+        <register type="NOA" address="0x00009888" value="0x01870C40" />
+        <register type="NOA" address="0x00009888" value="0x17880000" />
+        <register type="NOA" address="0x00009888" value="0x022F4000" />
+        <register type="NOA" address="0x00009888" value="0x0A4C0040" />
+        <register type="NOA" address="0x00009888" value="0x0C0D8000" />
+        <register type="NOA" address="0x00009888" value="0x040D4000" />
+        <register type="NOA" address="0x00009888" value="0x060D2000" />
+        <register type="NOA" address="0x00009888" value="0x020E5400" />
+        <register type="NOA" address="0x00009888" value="0x000E0000" />
+        <register type="NOA" address="0x00009888" value="0x080F0040" />
+        <register type="NOA" address="0x00009888" value="0x000F0000" />
+        <register type="NOA" address="0x00009888" value="0x100F0000" />
+        <register type="NOA" address="0x00009888" value="0x0E0F0040" />
+        <register type="NOA" address="0x00009888" value="0x0C2C8000" />
+        <register type="NOA" address="0x00009888" value="0x06104000" />
+        <register type="NOA" address="0x00009888" value="0x06110012" />
+        <register type="NOA" address="0x00009888" value="0x06131000" />
+        <register type="NOA" address="0x00009888" value="0x01898000" />
+        <register type="NOA" address="0x00009888" value="0x0D890100" />
+        <register type="NOA" address="0x00009888" value="0x03898000" />
+        <register type="NOA" address="0x00009888" value="0x09808000" />
+        <register type="NOA" address="0x00009888" value="0x0B808000" />
+        <register type="NOA" address="0x00009888" value="0x0380C000" />
+        <register type="NOA" address="0x00009888" value="0x0F8A0075" />
+        <register type="NOA" address="0x00009888" value="0x1D8A0000" />
+        <register type="NOA" address="0x00009888" value="0x118A8000" />
+        <register type="NOA" address="0x00009888" value="0x1B8A4000" />
+        <register type="NOA" address="0x00009888" value="0x138A8000" />
+        <register type="NOA" address="0x00009888" value="0x1D81A000" />
+        <register type="NOA" address="0x00009888" value="0x15818000" />
+        <register type="NOA" address="0x00009888" value="0x17818000" />
+        <register type="NOA" address="0x00009888" value="0x0B820030" />
+        <register type="NOA" address="0x00009888" value="0x07828000" />
+        <register type="NOA" address="0x00009888" value="0x0D824000" />
+        <register type="NOA" address="0x00009888" value="0x0F828000" />
+        <register type="NOA" address="0x00009888" value="0x05824000" />
+        <register type="NOA" address="0x00009888" value="0x0D830003" />
+        <register type="NOA" address="0x00009888" value="0x0583000C" />
+        <register type="NOA" address="0x00009888" value="0x09830000" />
+        <register type="NOA" address="0x00009888" value="0x03838000" />
+        <register type="NOA" address="0x00009888" value="0x07838000" />
+        <register type="NOA" address="0x00009888" value="0x0B840980" />
+        <register type="NOA" address="0x00009888" value="0x03844D80" />
+        <register type="NOA" address="0x00009888" value="0x11840000" />
+        <register type="NOA" address="0x00009888" value="0x09848000" />
+        <register type="NOA" address="0x00009888" value="0x09850080" />
+        <register type="NOA" address="0x00009888" value="0x03850003" />
+        <register type="NOA" address="0x00009888" value="0x01850000" />
+        <register type="NOA" address="0x00009888" value="0x07860000" />
+        <register type="NOA" address="0x00009888" value="0x0F860400" />
+        <register type="NOA" address="0x00009888" value="0x09870032" />
+        <register type="NOA" address="0x00009888" value="0x01888052" />
+        <register type="NOA" address="0x00009888" value="0x11880000" />
+        <register type="NOA" address="0x00009888" value="0x09884000" />
+        <register type="NOA" address="0x00009888" value="0x1B931001" />
+        <register type="NOA" address="0x00009888" value="0x1D930001" />
+        <register type="NOA" address="0x00009888" value="0x19934000" />
+        <register type="NOA" address="0x00009888" value="0x1B958000" />
+        <register type="NOA" address="0x00009888" value="0x1D950094" />
+        <register type="NOA" address="0x00009888" value="0x19958000" />
+        <register type="NOA" address="0x00009888" value="0x09E58000" />
+        <register type="NOA" address="0x00009888" value="0x0BE58000" />
+        <register type="NOA" address="0x00009888" value="0x03E5C000" />
+        <register type="NOA" address="0x00009888" value="0x0592C000" />
+        <register type="NOA" address="0x00009888" value="0x0B928000" />
+        <register type="NOA" address="0x00009888" value="0x0D924000" />
+        <register type="NOA" address="0x00009888" value="0x0F924000" />
+        <register type="NOA" address="0x00009888" value="0x11928000" />
+        <register type="NOA" address="0x00009888" value="0x1392C000" />
+        <register type="NOA" address="0x00009888" value="0x09924000" />
+        <register type="NOA" address="0x00009888" value="0x01985000" />
+        <register type="NOA" address="0x00009888" value="0x07988000" />
+        <register type="NOA" address="0x00009888" value="0x09981000" />
+        <register type="NOA" address="0x00009888" value="0x0B982000" />
+        <register type="NOA" address="0x00009888" value="0x0D982000" />
+        <register type="NOA" address="0x00009888" value="0x0F989000" />
+        <register type="NOA" address="0x00009888" value="0x05982000" />
+        <register type="NOA" address="0x00009888" value="0x13904000" />
+        <register type="NOA" address="0x00009888" value="0x21904000" />
+        <register type="NOA" address="0x00009888" value="0x23904000" />
+        <register type="NOA" address="0x00009888" value="0x25908000" />
+        <register type="NOA" address="0x00009888" value="0x27904000" />
+        <register type="NOA" address="0x00009888" value="0x29908000" />
+        <register type="NOA" address="0x00009888" value="0x2B904000" />
+        <register type="NOA" address="0x00009888" value="0x2F904000" />
+        <register type="NOA" address="0x00009888" value="0x31904000" />
+        <register type="NOA" address="0x00009888" value="0x15904000" />
+        <register type="NOA" address="0x00009888" value="0x17908000" />
+        <register type="NOA" address="0x00009888" value="0x19908000" />
+        <register type="NOA" address="0x00009888" value="0x1B904000" />
+        <register type="NOA" address="0x00009888" value="0x1190C080" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x41900440" />
+        <register type="NOA" address="0x00009888" value="0x55900000" />
+        <register type="NOA" address="0x00009888" value="0x45900400" />
+        <register type="NOA" address="0x00009888" value="0x47900C21" />
+        <register type="NOA" address="0x00009888" value="0x57900400" />
+        <register type="NOA" address="0x00009888" value="0x49900042" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+        <register type="NOA" address="0x00009888" value="0x4B900024" />
+        <register type="NOA" address="0x00009888" value="0x59900000" />
+        <register type="NOA" address="0x00009888" value="0x43900841" />
+        <register type="NOA" address="0x00009888" value="0x53900400" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002724" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002770" value="0x0007FFEA" />
+        <register type="OA" address="0x00002774" value="0x00007FFC" />
+        <register type="OA" address="0x00002778" value="0x0007AFFA" />
+        <register type="OA" address="0x0000277C" value="0x0000F5FD" />
+        <register type="OA" address="0x00002780" value="0x00079FFA" />
+        <register type="OA" address="0x00002784" value="0x0000F3FB" />
+        <register type="OA" address="0x00002788" value="0x0007BF7A" />
+        <register type="OA" address="0x0000278C" value="0x0000F7E7" />
+        <register type="OA" address="0x00002790" value="0x0007FEFA" />
+        <register type="OA" address="0x00002794" value="0x0000F7CF" />
+        <register type="OA" address="0x00002798" value="0x00077FFA" />
+        <register type="OA" address="0x0000279C" value="0x0000EFDF" />
+        <register type="OA" address="0x000027A0" value="0x0006FFFA" />
+        <register type="OA" address="0x000027A4" value="0x0000CFBF" />
+        <register type="OA" address="0x000027A8" value="0x0003FFFA" />
+        <register type="OA" address="0x000027AC" value="0x00005F7F" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00015014" />
+        <register type="FLEX" address="0x0000E658" value="0x00025024" />
+        <register type="FLEX" address="0x0000E758" value="0x00035034" />
+        <register type="FLEX" address="0x0000E45C" value="0x00045044" />
+        <register type="FLEX" address="0x0000E55C" value="0x00055054" />
+        <register type="FLEX" address="0x0000E65C" value="0x00065064" />
+    </register_config>
+  </set>
+
+  <set name="Memory Reads Distribution Gen9"
+       mdapi_supported_apis="VK OGL OCL IO BB"
+       underscore_name="memory_reads"
+       hw_config_guid="57b59202-172b-477a-87de-33f85572c589"
+       chipset="KBLGT2"
+       symbol_name="MemoryReads"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GtiL3Bank0Reads"
+             description="The total number of GTI memory reads from L3 Bank 0 (L3 Cache misses)."
+             data_type="uint64"
+             equation="C 4 READ"
+             underscore_name="gti_l3_bank0_reads"
+             units="messages"
+             symbol_name="GtiL3Bank0Reads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/L3"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="GtiRingAccesses"
+             description="The total number of all accesses from GTI to the ring."
+             data_type="uint64"
+             equation="C 3 READ 2 UMUL"
+             underscore_name="gti_ring_accesses"
+             units="messages"
+             symbol_name="GtiRingAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="GtiL3Bank3Reads"
+             description="The total number of GTI memory reads from L3 Bank 3 (L3 Cache misses)."
+             data_type="uint64"
+             equation="C 7 READ"
+             underscore_name="gti_l3_bank3_reads"
+             units="messages"
+             symbol_name="GtiL3Bank3Reads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="GTI/L3"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="GtiRsMemoryReads"
+             description="The total number of GTI memory reads from Resource Streamer."
+             data_type="uint64"
+             equation="B 2 READ"
+             underscore_name="gti_rs_memory_reads"
+             units="messages"
+             symbol_name="GtiRsMemoryReads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/3D Pipe/Resource Streamer"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GtiHizMemoryReads"
+             description="The total number of GTI memory reads from Hierarchical Depth Cache (Hi-Depth Cache misses)."
+             data_type="uint64"
+             equation="B 5 READ"
+             underscore_name="gti_hiz_memory_reads"
+             units="messages"
+             symbol_name="GtiHizMemoryReads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Depth Cache"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texel lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="GtiRccMemoryReads"
+             description="The total number of GTI memory reads from Render Color Cache (Render Color Cache misses)."
+             data_type="uint64"
+             equation="B 3 READ"
+             underscore_name="gti_rcc_memory_reads"
+             units="messages"
+             symbol_name="GtiRccMemoryReads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Color Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GtiL3Bank1Reads"
+             description="The total number of GTI memory reads from L3 Bank 1 (L3 Cache misses)."
+             data_type="uint64"
+             equation="C 5 READ"
+             underscore_name="gti_l3_bank1_reads"
+             units="messages"
+             symbol_name="GtiL3Bank1Reads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="GTI/L3"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GtiCmdStreamerMemoryReads"
+             description="The total number of GTI memory reads from Command Streamer."
+             data_type="uint64"
+             equation="B 0 READ"
+             underscore_name="gti_cmd_streamer_memory_reads"
+             units="messages"
+             symbol_name="GtiCmdStreamerMemoryReads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/3D Pipe/Command Streamer"
+             />
+    <counter name="GtiL3Bank2Reads"
+             description="The total number of GTI memory reads from L3 Bank 2 (L3 Cache misses)."
+             data_type="uint64"
+             equation="C 6 READ"
+             underscore_name="gti_l3_bank2_reads"
+             units="messages"
+             symbol_name="GtiL3Bank2Reads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="GTI/L3"
+             />
+    <counter name="GtiMemoryReads"
+             description="The total number of GTI memory reads."
+             data_type="uint64"
+             equation="C 0 READ"
+             underscore_name="gti_memory_reads"
+             units="messages"
+             symbol_name="GtiMemoryReads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="GtiRczMemoryReads"
+             description="The total number of GTI memory reads from Render Depth Cache (Render Depth Cache misses)."
+             data_type="uint64"
+             equation="B 7 READ"
+             underscore_name="gti_rcz_memory_reads"
+             units="messages"
+             symbol_name="GtiRczMemoryReads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Depth Cache"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="GtiMscMemoryReads"
+             description="The total number of GTI memory reads from Multisampling Color Cache (Multisampling Color Cache misses)."
+             data_type="uint64"
+             equation="B 4 READ"
+             underscore_name="gti_msc_memory_reads"
+             units="messages"
+             symbol_name="GtiMscMemoryReads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Color Cache"
+             />
+    <counter name="GtiVfMemoryReads"
+             description="The total number of GTI memory reads from Vertex Fetch."
+             data_type="uint64"
+             equation="B 1 READ"
+             underscore_name="gti_vf_memory_reads"
+             units="messages"
+             symbol_name="GtiVfMemoryReads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/3D Pipe/Vertex Fetch"
+             />
+    <counter name="GtiStcMemoryReads"
+             description="The total number of GTI memory reads from Stencil Cache (Stencil Cache misses)."
+             data_type="uint64"
+             equation="B 6 READ"
+             underscore_name="gti_stc_memory_reads"
+             units="messages"
+             symbol_name="GtiStcMemoryReads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Depth Cache"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GtiL3Reads"
+             description="The total number of GTI memory reads from L3 (L3 Cache misses)."
+             data_type="uint64"
+             equation="$GtiL3Bank0Reads $GtiL3Bank1Reads $GtiL3Bank2Reads $GtiL3Bank3Reads UADD UADD UADD"
+             underscore_name="gti_l3_reads"
+             units="messages"
+             symbol_name="GtiL3Reads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/L3"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x11810C00" />
+        <register type="NOA" address="0x00009888" value="0x1381001A" />
+        <register type="NOA" address="0x00009888" value="0x37906800" />
+        <register type="NOA" address="0x00009888" value="0x3F900064" />
+        <register type="NOA" address="0x00009888" value="0x03811300" />
+        <register type="NOA" address="0x00009888" value="0x05811B12" />
+        <register type="NOA" address="0x00009888" value="0x0781001A" />
+        <register type="NOA" address="0x00009888" value="0x1F810000" />
+        <register type="NOA" address="0x00009888" value="0x17810000" />
+        <register type="NOA" address="0x00009888" value="0x19810000" />
+        <register type="NOA" address="0x00009888" value="0x1B810000" />
+        <register type="NOA" address="0x00009888" value="0x1D810000" />
+        <register type="NOA" address="0x00009888" value="0x1B930055" />
+        <register type="NOA" address="0x00009888" value="0x03E58000" />
+        <register type="NOA" address="0x00009888" value="0x05E5C000" />
+        <register type="NOA" address="0x00009888" value="0x07E54000" />
+        <register type="NOA" address="0x00009888" value="0x13900150" />
+        <register type="NOA" address="0x00009888" value="0x21900151" />
+        <register type="NOA" address="0x00009888" value="0x23900152" />
+        <register type="NOA" address="0x00009888" value="0x25900153" />
+        <register type="NOA" address="0x00009888" value="0x27900154" />
+        <register type="NOA" address="0x00009888" value="0x29900155" />
+        <register type="NOA" address="0x00009888" value="0x2B900156" />
+        <register type="NOA" address="0x00009888" value="0x2D900157" />
+        <register type="NOA" address="0x00009888" value="0x2F90015F" />
+        <register type="NOA" address="0x00009888" value="0x31900105" />
+        <register type="NOA" address="0x00009888" value="0x15900103" />
+        <register type="NOA" address="0x00009888" value="0x17900101" />
+        <register type="NOA" address="0x00009888" value="0x35900000" />
+        <register type="NOA" address="0x00009888" value="0x19908000" />
+        <register type="NOA" address="0x00009888" value="0x1B908000" />
+        <register type="NOA" address="0x00009888" value="0x1D908000" />
+        <register type="NOA" address="0x00009888" value="0x1F908000" />
+        <register type="NOA" address="0x00009888" value="0x11900000" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x41900C60" />
+        <register type="NOA" address="0x00009888" value="0x55900000" />
+        <register type="NOA" address="0x00009888" value="0x45900C00" />
+        <register type="NOA" address="0x00009888" value="0x47900C63" />
+        <register type="NOA" address="0x00009888" value="0x57900000" />
+        <register type="NOA" address="0x00009888" value="0x49900C63" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+        <register type="NOA" address="0x00009888" value="0x4B900063" />
+        <register type="NOA" address="0x00009888" value="0x59900000" />
+        <register type="NOA" address="0x00009888" value="0x43900003" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x0000272C" value="0xFFFFFFFF" />
+        <register type="OA" address="0x00002728" value="0xFFFFFFFF" />
+        <register type="OA" address="0x00002724" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x0000271C" value="0xFFFFFFFF" />
+        <register type="OA" address="0x00002718" value="0xFFFFFFFF" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x0000274C" value="0x86543210" />
+        <register type="OA" address="0x00002748" value="0x86543210" />
+        <register type="OA" address="0x00002744" value="0x00006667" />
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x0000275C" value="0x86543210" />
+        <register type="OA" address="0x00002758" value="0x86543210" />
+        <register type="OA" address="0x00002754" value="0x00006465" />
+        <register type="OA" address="0x00002750" value="0x00000000" />
+        <register type="OA" address="0x00002770" value="0x0007F81A" />
+        <register type="OA" address="0x00002774" value="0x0000FE00" />
+        <register type="OA" address="0x00002778" value="0x0007F82A" />
+        <register type="OA" address="0x0000277C" value="0x0000FE00" />
+        <register type="OA" address="0x00002780" value="0x0007F872" />
+        <register type="OA" address="0x00002784" value="0x0000FE00" />
+        <register type="OA" address="0x00002788" value="0x0007F8BA" />
+        <register type="OA" address="0x0000278C" value="0x0000FE00" />
+        <register type="OA" address="0x00002790" value="0x0007F87A" />
+        <register type="OA" address="0x00002794" value="0x0000FE00" />
+        <register type="OA" address="0x00002798" value="0x0007F8EA" />
+        <register type="OA" address="0x0000279C" value="0x0000FE00" />
+        <register type="OA" address="0x000027A0" value="0x0007F8E2" />
+        <register type="OA" address="0x000027A4" value="0x0000FE00" />
+        <register type="OA" address="0x000027A8" value="0x0007F8F2" />
+        <register type="OA" address="0x000027AC" value="0x0000FE00" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00015014" />
+        <register type="FLEX" address="0x0000E658" value="0x00025024" />
+        <register type="FLEX" address="0x0000E758" value="0x00035034" />
+        <register type="FLEX" address="0x0000E45C" value="0x00045044" />
+        <register type="FLEX" address="0x0000E55C" value="0x00055054" />
+        <register type="FLEX" address="0x0000E65C" value="0x00065064" />
+    </register_config>
+  </set>
+
+  <set name="Memory Writes Distribution Gen9"
+       mdapi_supported_apis="VK OGL OCL IO BB"
+       underscore_name="memory_writes"
+       hw_config_guid="3addf8ef-8e9b-40f5-a448-3dbb5d5128b0"
+       chipset="KBLGT2"
+       symbol_name="MemoryWrites"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GtiMemoryWrites"
+             description="The total number of GTI memory writes."
+             data_type="uint64"
+             equation="C 0 READ"
+             underscore_name="gti_memory_writes"
+             units="messages"
+             symbol_name="GtiMemoryWrites"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="GtiRingAccesses"
+             description="The total number of all GTI accesses to the ring."
+             data_type="uint64"
+             equation="C 3 READ 2 UMUL"
+             underscore_name="gti_ring_accesses"
+             units="messages"
+             symbol_name="GtiRingAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="GtiMscMemoryWrites"
+             description="The total number of GTI memory writes from Multisampling Color Cache (Multisampling Color Cache invalidations)."
+             data_type="uint64"
+             equation="B 4 READ"
+             underscore_name="gti_msc_memory_writes"
+             units="messages"
+             symbol_name="GtiMscMemoryWrites"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Color Cache"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="GtiCmdStreamerMemoryWrites"
+             description="The total number of GTI memory writes from Command Streamer."
+             data_type="uint64"
+             equation="B 0 READ"
+             underscore_name="gti_cmd_streamer_memory_writes"
+             units="messages"
+             symbol_name="GtiCmdStreamerMemoryWrites"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/3D Pipe/Command Streamer"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GtiL3Bank0Writes"
+             description="The total number of GTI memory writes from L3 Bank 0 (L3 Bank 0 invalidations)."
+             data_type="uint64"
+             equation="C 4 READ"
+             underscore_name="gti_l3_bank0_writes"
+             units="messages"
+             symbol_name="GtiL3Bank0Writes"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/L3"
+             />
+    <counter name="GtiL3Bank1Writes"
+             description="The total number of GTI memory writes from L3 Bank 1 (L3 Bank 1 invalidations)."
+             data_type="uint64"
+             equation="C 5 READ"
+             underscore_name="gti_l3_bank1_writes"
+             units="messages"
+             symbol_name="GtiL3Bank1Writes"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/L3"
+             />
+    <counter name="GtiL3Bank2Writes"
+             description="The total number of GTI memory writes from L3 Bank 2 (L3 Bank 2 invalidations)."
+             data_type="uint64"
+             equation="C 6 READ"
+             underscore_name="gti_l3_bank2_writes"
+             units="messages"
+             symbol_name="GtiL3Bank2Writes"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/L3"
+             />
+    <counter name="GtiL3Bank3Writes"
+             description="The total number of GTI memory writes from L3 Bank 3 (L3 Bank 3 invalidations)."
+             data_type="uint64"
+             equation="C 7 READ"
+             underscore_name="gti_l3_bank3_writes"
+             units="messages"
+             symbol_name="GtiL3Bank3Writes"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/L3"
+             />
+    <counter name="GtiL3Writes"
+             description="The total number of GTI memory writes from L3 (L3 invalidations)."
+             data_type="uint64"
+             equation="$GtiL3Bank0Writes $GtiL3Bank1Writes $GtiL3Bank2Writes $GtiL3Bank3Writes UADD UADD UADD"
+             underscore_name="gti_l3_writes"
+             units="messages"
+             symbol_name="GtiL3Writes"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/L3"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GtiRccMemoryWrites"
+             description="The total number of GTI memory writes from Render Color Cache (Render Color Cache invalidations)."
+             data_type="uint64"
+             equation="B 3 READ"
+             underscore_name="gti_rcc_memory_writes"
+             units="messages"
+             symbol_name="GtiRccMemoryWrites"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Color Cache"
+             />
+    <counter name="GtiSoMemoryWrites"
+             description="The total number of GTI memory writes from Stream Output."
+             data_type="uint64"
+             equation="B 2 READ"
+             underscore_name="gti_so_memory_writes"
+             units="messages"
+             symbol_name="GtiSoMemoryWrites"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/3D Pipe/Stream Output"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GtiStcMemoryWrites"
+             description="The total number of GTI memory writes from Stencil Cache."
+             data_type="uint64"
+             equation="B 6 READ"
+             underscore_name="gti_stc_memory_writes"
+             units="messages"
+             symbol_name="GtiStcMemoryWrites"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Depth Cache"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="GtiRczMemoryWrites"
+             description="The total number of GTI memory writes from Render Depth Cache."
+             data_type="uint64"
+             equation="B 7 READ"
+             underscore_name="gti_rcz_memory_writes"
+             units="messages"
+             symbol_name="GtiRczMemoryWrites"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Depth Cache"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="GtiHizMemoryWrites"
+             description="The total number of GTI memory writes from Hierarchical Depth Cache."
+             data_type="uint64"
+             equation="B 5 READ"
+             underscore_name="gti_hiz_memory_writes"
+             units="messages"
+             symbol_name="GtiHizMemoryWrites"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Depth Cache"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x11810C00" />
+        <register type="NOA" address="0x00009888" value="0x1381001A" />
+        <register type="NOA" address="0x00009888" value="0x37906800" />
+        <register type="NOA" address="0x00009888" value="0x3F901000" />
+        <register type="NOA" address="0x00009888" value="0x03811300" />
+        <register type="NOA" address="0x00009888" value="0x05811B12" />
+        <register type="NOA" address="0x00009888" value="0x0781001A" />
+        <register type="NOA" address="0x00009888" value="0x1F810000" />
+        <register type="NOA" address="0x00009888" value="0x17810000" />
+        <register type="NOA" address="0x00009888" value="0x19810000" />
+        <register type="NOA" address="0x00009888" value="0x1B810000" />
+        <register type="NOA" address="0x00009888" value="0x1D810000" />
+        <register type="NOA" address="0x00009888" value="0x1B930055" />
+        <register type="NOA" address="0x00009888" value="0x03E58000" />
+        <register type="NOA" address="0x00009888" value="0x05E5C000" />
+        <register type="NOA" address="0x00009888" value="0x07E54000" />
+        <register type="NOA" address="0x00009888" value="0x13900160" />
+        <register type="NOA" address="0x00009888" value="0x21900161" />
+        <register type="NOA" address="0x00009888" value="0x23900162" />
+        <register type="NOA" address="0x00009888" value="0x25900163" />
+        <register type="NOA" address="0x00009888" value="0x27900164" />
+        <register type="NOA" address="0x00009888" value="0x29900165" />
+        <register type="NOA" address="0x00009888" value="0x2B900166" />
+        <register type="NOA" address="0x00009888" value="0x2D900167" />
+        <register type="NOA" address="0x00009888" value="0x2F900150" />
+        <register type="NOA" address="0x00009888" value="0x31900105" />
+        <register type="NOA" address="0x00009888" value="0x15900103" />
+        <register type="NOA" address="0x00009888" value="0x17900101" />
+        <register type="NOA" address="0x00009888" value="0x35900000" />
+        <register type="NOA" address="0x00009888" value="0x19908000" />
+        <register type="NOA" address="0x00009888" value="0x1B908000" />
+        <register type="NOA" address="0x00009888" value="0x1D908000" />
+        <register type="NOA" address="0x00009888" value="0x1F908000" />
+        <register type="NOA" address="0x00009888" value="0x11900000" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x41900C60" />
+        <register type="NOA" address="0x00009888" value="0x55900000" />
+        <register type="NOA" address="0x00009888" value="0x45900C00" />
+        <register type="NOA" address="0x00009888" value="0x47900C63" />
+        <register type="NOA" address="0x00009888" value="0x57900000" />
+        <register type="NOA" address="0x00009888" value="0x49900C63" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+        <register type="NOA" address="0x00009888" value="0x4B900063" />
+        <register type="NOA" address="0x00009888" value="0x59900000" />
+        <register type="NOA" address="0x00009888" value="0x43900003" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x0000272C" value="0xFFFFFFFF" />
+        <register type="OA" address="0x00002728" value="0xFFFFFFFF" />
+        <register type="OA" address="0x00002724" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x0000271C" value="0xFFFFFFFF" />
+        <register type="OA" address="0x00002718" value="0xFFFFFFFF" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x0000274C" value="0x86543210" />
+        <register type="OA" address="0x00002748" value="0x86543210" />
+        <register type="OA" address="0x00002744" value="0x00006667" />
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x0000275C" value="0x86543210" />
+        <register type="OA" address="0x00002758" value="0x86543210" />
+        <register type="OA" address="0x00002754" value="0x00006465" />
+        <register type="OA" address="0x00002750" value="0x00000000" />
+        <register type="OA" address="0x00002770" value="0x0007F81A" />
+        <register type="OA" address="0x00002774" value="0x0000FE00" />
+        <register type="OA" address="0x00002778" value="0x0007F82A" />
+        <register type="OA" address="0x0000277C" value="0x0000FE00" />
+        <register type="OA" address="0x00002780" value="0x0007F822" />
+        <register type="OA" address="0x00002784" value="0x0000FE00" />
+        <register type="OA" address="0x00002788" value="0x0007F8BA" />
+        <register type="OA" address="0x0000278C" value="0x0000FE00" />
+        <register type="OA" address="0x00002790" value="0x0007F87A" />
+        <register type="OA" address="0x00002794" value="0x0000FE00" />
+        <register type="OA" address="0x00002798" value="0x0007F8EA" />
+        <register type="OA" address="0x0000279C" value="0x0000FE00" />
+        <register type="OA" address="0x000027A0" value="0x0007F8E2" />
+        <register type="OA" address="0x000027A4" value="0x0000FE00" />
+        <register type="OA" address="0x000027A8" value="0x0007F8F2" />
+        <register type="OA" address="0x000027AC" value="0x0000FE00" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00015014" />
+        <register type="FLEX" address="0x0000E658" value="0x00025024" />
+        <register type="FLEX" address="0x0000E758" value="0x00035034" />
+        <register type="FLEX" address="0x0000E45C" value="0x00045044" />
+        <register type="FLEX" address="0x0000E55C" value="0x00055054" />
+        <register type="FLEX" address="0x0000E65C" value="0x00065064" />
+    </register_config>
+  </set>
+
+  <set name="Compute Metrics Extended Gen9"
+       mdapi_supported_apis="VK OGL4 OCL IO BB"
+       underscore_name="compute_extended"
+       hw_config_guid="4af0400a-81c3-47db-a6b6-deddbd75680e"
+       chipset="KBLGT2"
+       symbol_name="ComputeExtended"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="fpu0_active"
+             units="percent"
+             symbol_name="Fpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="fpu1_active"
+             units="percent"
+             symbol_name="Fpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU AVG IPC Rate"
+             description="The average rate of IPC calculated for 2 FPU pipelines."
+             data_type="float"
+             max_equation="2"
+             equation="A 9 READ  A 10 READ  A 11 READ UADD  A 9 READ USUB FDIV 1 FADD"
+             underscore_name="eu_avg_ipc_rate"
+             units="number"
+             symbol_name="EuAvgIpcRate"
+             semantic_type="ratio"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Typed Writes 0"
+             description="The subslice 0 typed writes."
+             data_type="uint64"
+             equation="C 0 READ"
+             underscore_name="typed_writes0"
+             units="messages"
+             symbol_name="TypedWrites0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="EuTypedAtomics0"
+             description="The subslice 0 EU Typed Atomics subslice 0."
+             data_type="uint64"
+             equation="B 5 READ"
+             underscore_name="eu_typed_atomics0"
+             units="messages"
+             symbol_name="EuTypedAtomics0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="Typed Atomics 0"
+             description="The subslice 0 typed atomics."
+             data_type="uint64"
+             equation="C 4 READ"
+             underscore_name="typed_atomics0"
+             units="messages"
+             symbol_name="TypedAtomics0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="TypedAtomicsPerCacheLine"
+             description="The ratio of EU typed atomics requests to L3 cache line writes."
+             data_type="float"
+             equation="$EuTypedAtomics0 $TypedAtomics0 FDIV"
+             underscore_name="typed_atomics_per_cache_line"
+             units="eu sends to l3 cache lines"
+             symbol_name="TypedAtomicsPerCacheLine"
+             semantic_type="ratio"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="EuUntypedReads0"
+             description="The subslice 0 EU Untyped Reads subslice 0."
+             data_type="uint64"
+             equation="B 0 READ"
+             underscore_name="eu_untyped_reads0"
+             units="messages"
+             symbol_name="EuUntypedReads0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="Untyped Writes 0"
+             description="The subslice 0 untyped writes (including SLM writes)."
+             data_type="uint64"
+             equation="C 1 READ"
+             underscore_name="untyped_writes0"
+             units="messages"
+             symbol_name="UntypedWrites0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="EuUntypedAtomics0"
+             description="The subslice 0 EU Untyped Atomics subslice 0."
+             data_type="uint64"
+             equation="B 4 READ"
+             underscore_name="eu_untyped_atomics0"
+             units="messages"
+             symbol_name="EuUntypedAtomics0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="EuUntypedWrites0"
+             description="The subslice 0 EU Untyped Writes subslice 0."
+             data_type="uint64"
+             equation="B 1 READ"
+             underscore_name="eu_untyped_writes0"
+             units="messages"
+             symbol_name="EuUntypedWrites0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="EuA64UntypedWrites0"
+             description="The subslice 0 EU A64 Untyped Writes subslice 0."
+             data_type="uint64"
+             equation="B 7 READ"
+             underscore_name="eu_a64_untyped_writes0"
+             units="messages"
+             symbol_name="EuA64UntypedWrites0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="UntypedWritesPerCacheLine"
+             description="The ratio of EU untyped write requests to L3 cache line writes."
+             data_type="float"
+             equation="$EuUntypedWrites0 $EuA64UntypedWrites0 UADD $UntypedWrites0 FDIV"
+             underscore_name="untyped_writes_per_cache_line"
+             units="eu sends to l3 cache lines"
+             symbol_name="UntypedWritesPerCacheLine"
+             semantic_type="ratio"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EuTypedWrites0"
+             description="The subslice 0 EU Typed Writes subslice 0."
+             data_type="uint64"
+             equation="B 3 READ"
+             underscore_name="eu_typed_writes0"
+             units="messages"
+             symbol_name="EuTypedWrites0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="TypedWritesPerCacheLine"
+             description="The ratio of EU typed write requests to L3 cache line writes."
+             data_type="float"
+             equation="$EuTypedWrites0 $TypedWrites0 FDIV"
+             underscore_name="typed_writes_per_cache_line"
+             units="eu sends to l3 cache lines"
+             symbol_name="TypedWritesPerCacheLine"
+             semantic_type="ratio"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="Typed Reads 0"
+             description="The subslice 0 typed reads."
+             data_type="uint64"
+             equation="C 2 READ"
+             underscore_name="typed_reads0"
+             units="messages"
+             symbol_name="TypedReads0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="Untyped Reads 0"
+             description="The subslice 0 untyped reads (including SLM reads)."
+             data_type="uint64"
+             equation="C 3 READ"
+             underscore_name="untyped_reads0"
+             units="messages"
+             symbol_name="UntypedReads0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="EuA64UntypedReads0"
+             description="The subslice 0 EU A64 Untyped Reads subslice 0."
+             data_type="uint64"
+             equation="B 6 READ"
+             underscore_name="eu_a64_untyped_reads0"
+             units="messages"
+             symbol_name="EuA64UntypedReads0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="EU Thread Occupancy"
+             description="The percentage of time in which hardware threads occupied EUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 13 READ 8 UMUL $EuCoresTotalCount UDIV $EuThreadsCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_thread_occupancy"
+             units="percent"
+             symbol_name="EuThreadOccupancy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EuTypedReads0"
+             description="The subslice 0 EU Typed Reads subslice 0."
+             data_type="uint64"
+             equation="B 2 READ"
+             underscore_name="eu_typed_reads0"
+             units="messages"
+             symbol_name="EuTypedReads0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="UntypedReadsPerCacheLine"
+             description="The ratio of EU untyped read requests to L3 cache line reads."
+             data_type="float"
+             equation="$EuUntypedReads0 $EuA64UntypedReads0 UADD $UntypedReads0 FDIV"
+             underscore_name="untyped_reads_per_cache_line"
+             units="eu sends to l3 cache lines"
+             symbol_name="UntypedReadsPerCacheLine"
+             semantic_type="ratio"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="TypedReadsPerCacheLine"
+             description="The ratio of EU typed read requests to L3 cache line reads."
+             data_type="float"
+             equation="$EuTypedReads0 $TypedReads0 FDIV"
+             underscore_name="typed_reads_per_cache_line"
+             units="eu sends to l3 cache lines"
+             symbol_name="TypedReadsPerCacheLine"
+             semantic_type="ratio"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <counter name="EU Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_send_active"
+             units="percent"
+             symbol_name="EuSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x106C00E0" />
+        <register type="NOA" address="0x00009888" value="0x141C8160" />
+        <register type="NOA" address="0x00009888" value="0x161C8015" />
+        <register type="NOA" address="0x00009888" value="0x181C0120" />
+        <register type="NOA" address="0x00009888" value="0x004E8000" />
+        <register type="NOA" address="0x00009888" value="0x0E4E8000" />
+        <register type="NOA" address="0x00009888" value="0x184E8000" />
+        <register type="NOA" address="0x00009888" value="0x1A4EAAA0" />
+        <register type="NOA" address="0x00009888" value="0x1C4E0002" />
+        <register type="NOA" address="0x00009888" value="0x024E8000" />
+        <register type="NOA" address="0x00009888" value="0x044E8000" />
+        <register type="NOA" address="0x00009888" value="0x064E8000" />
+        <register type="NOA" address="0x00009888" value="0x084E8000" />
+        <register type="NOA" address="0x00009888" value="0x0A4E8000" />
+        <register type="NOA" address="0x00009888" value="0x0E6C0B01" />
+        <register type="NOA" address="0x00009888" value="0x006C0200" />
+        <register type="NOA" address="0x00009888" value="0x026C000C" />
+        <register type="NOA" address="0x00009888" value="0x1C6C0000" />
+        <register type="NOA" address="0x00009888" value="0x1E6C0000" />
+        <register type="NOA" address="0x00009888" value="0x1A6C0000" />
+        <register type="NOA" address="0x00009888" value="0x0E1BC000" />
+        <register type="NOA" address="0x00009888" value="0x001B8000" />
+        <register type="NOA" address="0x00009888" value="0x021BC000" />
+        <register type="NOA" address="0x00009888" value="0x001C0041" />
+        <register type="NOA" address="0x00009888" value="0x061C4200" />
+        <register type="NOA" address="0x00009888" value="0x081C4443" />
+        <register type="NOA" address="0x00009888" value="0x0A1C4645" />
+        <register type="NOA" address="0x00009888" value="0x0C1C7647" />
+        <register type="NOA" address="0x00009888" value="0x041C7357" />
+        <register type="NOA" address="0x00009888" value="0x1C1C0030" />
+        <register type="NOA" address="0x00009888" value="0x101C0000" />
+        <register type="NOA" address="0x00009888" value="0x1A1C0000" />
+        <register type="NOA" address="0x00009888" value="0x121C8000" />
+        <register type="NOA" address="0x00009888" value="0x004C8000" />
+        <register type="NOA" address="0x00009888" value="0x0A4CAA2A" />
+        <register type="NOA" address="0x00009888" value="0x0C4C02AA" />
+        <register type="NOA" address="0x00009888" value="0x084CA000" />
+        <register type="NOA" address="0x00009888" value="0x000DA000" />
+        <register type="NOA" address="0x00009888" value="0x060D8000" />
+        <register type="NOA" address="0x00009888" value="0x080DA000" />
+        <register type="NOA" address="0x00009888" value="0x0A0DA000" />
+        <register type="NOA" address="0x00009888" value="0x0C0DA000" />
+        <register type="NOA" address="0x00009888" value="0x0E0DA000" />
+        <register type="NOA" address="0x00009888" value="0x020DA000" />
+        <register type="NOA" address="0x00009888" value="0x040DA000" />
+        <register type="NOA" address="0x00009888" value="0x0C0F5400" />
+        <register type="NOA" address="0x00009888" value="0x0E0F5515" />
+        <register type="NOA" address="0x00009888" value="0x100F0155" />
+        <register type="NOA" address="0x00009888" value="0x002C8000" />
+        <register type="NOA" address="0x00009888" value="0x0E2C8000" />
+        <register type="NOA" address="0x00009888" value="0x162CAA00" />
+        <register type="NOA" address="0x00009888" value="0x182C00AA" />
+        <register type="NOA" address="0x00009888" value="0x022C8000" />
+        <register type="NOA" address="0x00009888" value="0x042C8000" />
+        <register type="NOA" address="0x00009888" value="0x062C8000" />
+        <register type="NOA" address="0x00009888" value="0x082C8000" />
+        <register type="NOA" address="0x00009888" value="0x0A2C8000" />
+        <register type="NOA" address="0x00009888" value="0x11907FFF" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x41900040" />
+        <register type="NOA" address="0x00009888" value="0x55900000" />
+        <register type="NOA" address="0x00009888" value="0x45900802" />
+        <register type="NOA" address="0x00009888" value="0x47900842" />
+        <register type="NOA" address="0x00009888" value="0x57900000" />
+        <register type="NOA" address="0x00009888" value="0x49900842" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+        <register type="NOA" address="0x00009888" value="0x4B900000" />
+        <register type="NOA" address="0x00009888" value="0x59900000" />
+        <register type="NOA" address="0x00009888" value="0x43900800" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002724" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002770" value="0x0007FC2A" />
+        <register type="OA" address="0x00002774" value="0x0000BF00" />
+        <register type="OA" address="0x00002778" value="0x0007FC6A" />
+        <register type="OA" address="0x0000277C" value="0x0000BF00" />
+        <register type="OA" address="0x00002780" value="0x0007FC92" />
+        <register type="OA" address="0x00002784" value="0x0000BF00" />
+        <register type="OA" address="0x00002788" value="0x0007FCA2" />
+        <register type="OA" address="0x0000278C" value="0x0000BF00" />
+        <register type="OA" address="0x00002790" value="0x0007FC32" />
+        <register type="OA" address="0x00002794" value="0x0000BF00" />
+        <register type="OA" address="0x00002798" value="0x0007FC9A" />
+        <register type="OA" address="0x0000279C" value="0x0000BF00" />
+        <register type="OA" address="0x000027A0" value="0x0007FE6A" />
+        <register type="OA" address="0x000027A4" value="0x0000BF00" />
+        <register type="OA" address="0x000027A8" value="0x0007FE7A" />
+        <register type="OA" address="0x000027AC" value="0x0000BF00" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00000003" />
+        <register type="FLEX" address="0x0000E658" value="0x00002001" />
+        <register type="FLEX" address="0x0000E758" value="0x00778008" />
+        <register type="FLEX" address="0x0000E45C" value="0x00088078" />
+        <register type="FLEX" address="0x0000E55C" value="0x00808708" />
+        <register type="FLEX" address="0x0000E65C" value="0x00A08908" />
+    </register_config>
+  </set>
+
+  <set name="Compute Metrics L3 Cache Gen9"
+       mdapi_supported_apis="VK OGL4 OCL IO BB"
+       underscore_name="compute_l3_cache"
+       hw_config_guid="0e22f995-79ca-4f67-83ab-e9d9772488d8"
+       chipset="KBLGT2"
+       symbol_name="ComputeL3Cache"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Bank 03 Accesses"
+             description="The total number of accesses to L3 Bank 03."
+             data_type="uint64"
+             equation="B 3 READ 2 UMUL"
+             underscore_name="l3_bank03_accesses"
+             units="messages"
+             symbol_name="L3Bank03Accesses"
+             availability="$SliceMask 0x01 AND"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="slice"
+             mdapi_group="L3"
+             />
+    <counter name="L3 Accesses"
+             description="The total number of L3 accesses from all entities."
+             data_type="uint64"
+             equation="C 0 READ C 1 READ B 2 READ B 3 READ UADD UADD UADD 2 UMUL"
+             underscore_name="l3_accesses"
+             units="messages"
+             symbol_name="L3Accesses"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Sampler Throughput"
+             description="The total number of GPU memory bytes transferred between samplers and L3 caches."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="A 29 READ 64 UMUL"
+             underscore_name="l3_sampler_throughput"
+             units="bytes"
+             symbol_name="L3SamplerThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Sampler"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="fpu0_active"
+             units="percent"
+             symbol_name="Fpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="fpu1_active"
+             units="percent"
+             symbol_name="Fpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU AVG IPC Rate"
+             description="The average rate of IPC calculated for 2 FPU pipelines."
+             data_type="float"
+             max_equation="2"
+             equation="A 9 READ  A 10 READ  A 11 READ UADD  A 9 READ USUB FDIV 1 FADD"
+             underscore_name="eu_avg_ipc_rate"
+             units="number"
+             symbol_name="EuAvgIpcRate"
+             semantic_type="ratio"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier4 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU0 Binary Instruction"
+             description="The percentage of time in which execution units were actively processing binary instructions on FPU0."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_binary_fpu0_instruction"
+             units="percent"
+             symbol_name="EuBinaryFpu0Instruction"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes/Instructions"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="EU FPU0 Hybrid Instruction"
+             description="The percentage of time in which execution units were actively processing hybrid instructions on FPU0."
+             data_type="float"
+             max_equation="100"
+             equation="A 13 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_hybrid_fpu0_instruction"
+             units="percent"
+             symbol_name="EuHybridFpu0Instruction"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="EU Array/Pipes/Instructions"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Misses"
+             description="The total number of L3 misses."
+             data_type="uint64"
+             equation="C 4 READ C 5 READ UADD"
+             underscore_name="l3_misses"
+             units="messages"
+             symbol_name="L3Misses"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/TAG"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="L3 Bank 00 Accesses"
+             description="The total number of accesses to L3 Bank 00."
+             data_type="uint64"
+             equation="C 0 READ 2 UMUL"
+             underscore_name="l3_bank00_accesses"
+             units="messages"
+             symbol_name="L3Bank00Accesses"
+             availability="$SliceMask 0x01 AND"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="slice"
+             mdapi_group="L3"
+             />
+    <counter name="EU FPU0 Move Instruction"
+             description="The percentage of time in which execution units were actively processing move instructions on FPU0."
+             data_type="float"
+             max_equation="100"
+             equation="A 19 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_move_fpu0_instruction"
+             units="percent"
+             symbol_name="EuMoveFpu0Instruction"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes/Instructions"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU FPU1 Hybrid Instruction"
+             description="The percentage of time in which execution units were actively processing hybrid instructions on FPU1."
+             data_type="float"
+             max_equation="100"
+             equation="A 14 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_hybrid_fpu1_instruction"
+             units="percent"
+             symbol_name="EuHybridFpu1Instruction"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="EU Array/Pipes/Instructions"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texel lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GTI Read Throughput"
+             description="The total number of GPU memory bytes read from GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL"
+             equation="C 6 READ 64 UMUL"
+             underscore_name="gti_read_throughput"
+             units="bytes"
+             symbol_name="GtiReadThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GTI L3 Throughput"
+             description="The total number of GPU memory bytes transferred between L3 caches and GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="C 4 READ C 5 READ UADD 64 UMUL"
+             underscore_name="gti_l3_throughput"
+             units="bytes"
+             symbol_name="GtiL3Throughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Bank 00 IC Accesses"
+             description="The total number of accesses to L3 Bank 00 from IC cache."
+             data_type="uint64"
+             equation="B 0 READ B 1 READ UADD 2 UMUL $L3Bank00Accesses UMIN"
+             underscore_name="l3_bank00_ic_accesses"
+             units="messages"
+             symbol_name="L3Bank00IcAccesses"
+             availability="$SliceMask 0x01 AND"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="slice"
+             mdapi_group="L3/IC"
+             />
+    <counter name="L3 Bank 00 IC Hits"
+             description="The total number of hits in L3 Bank 00 from IC cache."
+             data_type="uint64"
+             equation="B 1 READ 2 UMUL $L3Bank00IcAccesses UMIN"
+             underscore_name="l3_bank00_ic_hits"
+             units="messages"
+             symbol_name="L3Bank00IcHits"
+             availability="$SliceMask 0x01 AND"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="slice"
+             mdapi_group="L3/IC"
+             />
+    <counter name="Sampler Accesses"
+             description="The total number of messages sent to samplers."
+             data_type="uint64"
+             equation="A 28 READ"
+             underscore_name="sampler_accesses"
+             units="messages"
+             symbol_name="SamplerAccesses"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler"
+             />
+    <counter name="L3 Bank 01 Accesses"
+             description="The total number of accesses to L3 Bank 01."
+             data_type="uint64"
+             equation="C 1 READ 2 UMUL"
+             underscore_name="l3_bank01_accesses"
+             units="messages"
+             symbol_name="L3Bank01Accesses"
+             availability="$SliceMask 0x01 AND"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="slice"
+             mdapi_group="L3"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU0 Ternary Instruction"
+             description="The percentage of time in which execution units were actively processing ternary instructions on FPU0."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_ternary_fpu0_instruction"
+             units="percent"
+             symbol_name="EuTernaryFpu0Instruction"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes/Instructions"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU FPU1 Move Instruction"
+             description="The percentage of time in which execution units were actively processing move instructions on FPU1."
+             data_type="float"
+             max_equation="100"
+             equation="A 20 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_move_fpu1_instruction"
+             units="percent"
+             symbol_name="EuMoveFpu1Instruction"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes/Instructions"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="L3 Bank 02 Accesses"
+             description="The total number of accesses to L3 Bank 02."
+             data_type="uint64"
+             equation="B 2 READ 2 UMUL"
+             underscore_name="l3_bank02_accesses"
+             units="messages"
+             symbol_name="L3Bank02Accesses"
+             availability="$SliceMask 0x01 AND"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="slice"
+             mdapi_group="L3"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="L3 Total Throughput"
+             description="The total number of GPU memory bytes transferred via L3."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="$L3Accesses 64 UMUL"
+             underscore_name="l3_total_throughput"
+             units="bytes"
+             symbol_name="L3TotalThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GTI Write Throughput"
+             description="The total number of GPU memory bytes written to GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 32 UMUL"
+             equation="C 7 READ 64 UMUL"
+             underscore_name="gti_write_throughput"
+             units="bytes"
+             symbol_name="GtiWriteThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="EU FPU1 Binary Instruction"
+             description="The percentage of time in which execution units were actively processing binary instructions on FPU1."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_binary_fpu1_instruction"
+             units="percent"
+             symbol_name="EuBinaryFpu1Instruction"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes/Instructions"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU1 Ternary Instruction"
+             description="The percentage of time in which execution units were actively processing ternary instructions on FPU1."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_ternary_fpu1_instruction"
+             units="percent"
+             symbol_name="EuTernaryFpu1Instruction"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes/Instructions"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_send_active"
+             units="percent"
+             symbol_name="EuSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x166C0760" />
+        <register type="NOA" address="0x00009888" value="0x1593001E" />
+        <register type="NOA" address="0x00009888" value="0x3F900003" />
+        <register type="NOA" address="0x00009888" value="0x004E8000" />
+        <register type="NOA" address="0x00009888" value="0x0E4E8000" />
+        <register type="NOA" address="0x00009888" value="0x184E8000" />
+        <register type="NOA" address="0x00009888" value="0x1A4E8020" />
+        <register type="NOA" address="0x00009888" value="0x1C4E0002" />
+        <register type="NOA" address="0x00009888" value="0x006C0051" />
+        <register type="NOA" address="0x00009888" value="0x066C5000" />
+        <register type="NOA" address="0x00009888" value="0x086C5C5D" />
+        <register type="NOA" address="0x00009888" value="0x0E6C5E5F" />
+        <register type="NOA" address="0x00009888" value="0x106C0000" />
+        <register type="NOA" address="0x00009888" value="0x186C0000" />
+        <register type="NOA" address="0x00009888" value="0x1C6C0000" />
+        <register type="NOA" address="0x00009888" value="0x1E6C0000" />
+        <register type="NOA" address="0x00009888" value="0x001B4000" />
+        <register type="NOA" address="0x00009888" value="0x061B8000" />
+        <register type="NOA" address="0x00009888" value="0x081BC000" />
+        <register type="NOA" address="0x00009888" value="0x0E1BC000" />
+        <register type="NOA" address="0x00009888" value="0x101C8000" />
+        <register type="NOA" address="0x00009888" value="0x1A1CE000" />
+        <register type="NOA" address="0x00009888" value="0x1C1C0030" />
+        <register type="NOA" address="0x00009888" value="0x004C8000" />
+        <register type="NOA" address="0x00009888" value="0x0A4C2A00" />
+        <register type="NOA" address="0x00009888" value="0x0C4C0280" />
+        <register type="NOA" address="0x00009888" value="0x000D2000" />
+        <register type="NOA" address="0x00009888" value="0x060D8000" />
+        <register type="NOA" address="0x00009888" value="0x080DA000" />
+        <register type="NOA" address="0x00009888" value="0x0E0DA000" />
+        <register type="NOA" address="0x00009888" value="0x0C0F0400" />
+        <register type="NOA" address="0x00009888" value="0x0E0F1500" />
+        <register type="NOA" address="0x00009888" value="0x100F0140" />
+        <register type="NOA" address="0x00009888" value="0x002C8000" />
+        <register type="NOA" address="0x00009888" value="0x0E2C8000" />
+        <register type="NOA" address="0x00009888" value="0x162C0A00" />
+        <register type="NOA" address="0x00009888" value="0x182C00A0" />
+        <register type="NOA" address="0x00009888" value="0x03933300" />
+        <register type="NOA" address="0x00009888" value="0x05930032" />
+        <register type="NOA" address="0x00009888" value="0x11930000" />
+        <register type="NOA" address="0x00009888" value="0x1B930000" />
+        <register type="NOA" address="0x00009888" value="0x1D900157" />
+        <register type="NOA" address="0x00009888" value="0x1F900158" />
+        <register type="NOA" address="0x00009888" value="0x35900000" />
+        <register type="NOA" address="0x00009888" value="0x19908000" />
+        <register type="NOA" address="0x00009888" value="0x1B908000" />
+        <register type="NOA" address="0x00009888" value="0x1190030F" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x41900000" />
+        <register type="NOA" address="0x00009888" value="0x55900000" />
+        <register type="NOA" address="0x00009888" value="0x45900021" />
+        <register type="NOA" address="0x00009888" value="0x47900000" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+        <register type="NOA" address="0x00009888" value="0x57900000" />
+        <register type="NOA" address="0x00009888" value="0x4B900000" />
+        <register type="NOA" address="0x00009888" value="0x59900000" />
+        <register type="NOA" address="0x00009888" value="0x53904444" />
+        <register type="NOA" address="0x00009888" value="0x43900000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x30800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x30800000" />
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002770" value="0x0007FFFA" />
+        <register type="OA" address="0x00002774" value="0x0000FEFE" />
+        <register type="OA" address="0x00002778" value="0x0007FFFA" />
+        <register type="OA" address="0x0000277C" value="0x0000FEFD" />
+        <register type="OA" address="0x00002790" value="0x0007FFFA" />
+        <register type="OA" address="0x00002794" value="0x0000FBEF" />
+        <register type="OA" address="0x00002798" value="0x0007FFFA" />
+        <register type="OA" address="0x0000279C" value="0x0000FBDF" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00000003" />
+        <register type="FLEX" address="0x0000E658" value="0x00002001" />
+        <register type="FLEX" address="0x0000E758" value="0x00101100" />
+        <register type="FLEX" address="0x0000E45C" value="0x00201200" />
+        <register type="FLEX" address="0x0000E55C" value="0x00301300" />
+        <register type="FLEX" address="0x0000E65C" value="0x00401400" />
+    </register_config>
+  </set>
+
+  <set name="Metric set HDCAndSF"
+       mdapi_supported_apis="VK OGL OCL IO BB"
+       underscore_name="hdc_and_sf"
+       hw_config_guid="fb149d66-fad2-4230-b0d7-4d689b9116d3"
+       chipset="KBLGT2"
+       symbol_name="HDCAndSF"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SQ is full"
+             description="The percentage of time when SQ is filled above a threshold (usually 48 entries)"
+             data_type="float"
+             max_equation="100"
+             equation="PERFCNT1 READ_REG 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gt_request_queue_full"
+             units="percent"
+             symbol_name="GTRequestQueueFull"
+             availability="true $QueryMode &&"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL4 OCL"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="Polygon Data Ready"
+             description="The percentage of time in which geometry pipeline output is ready"
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="poly_data_ready"
+             units="percent"
+             symbol_name="PolyDataReady"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/3D Pipe/Strip-Fans"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="HDC stalled by L3 (s0.ss1)"
+             description="Percentage of time when HDC has messages to L3, but it's stalled due to lack of credits (s0.ss1)"
+             data_type="float"
+             max_equation="100"
+             equation="C 5 READ C 4 READ USUB 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="non_sampler_shader01_access_stalled_on_l3"
+             units="percent"
+             symbol_name="NonSamplerShader01AccessStalledOnL3"
+             availability="$SubsliceMask 0x2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="GPU/Data Port"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="HDC stalled by L3 (s0.ss2)"
+             description="Percentage of time when HDC has messages to L3, but it's stalled due to lack of credits (s0.ss2)"
+             data_type="float"
+             max_equation="100"
+             equation="C 3 READ C 2 READ USUB 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="non_sampler_shader02_access_stalled_on_l3"
+             units="percent"
+             symbol_name="NonSamplerShader02AccessStalledOnL3"
+             availability="$SubsliceMask 0x4 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="GPU/Data Port"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="HDC stalled by L3 (s0.ss0)"
+             description="Percentage of time when HDC has messages to L3, but it's stalled due to lack of credits (s0.ss0)"
+             data_type="float"
+             max_equation="100"
+             equation="C 7 READ C 6 READ USUB 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="non_sampler_shader00_access_stalled_on_l3"
+             units="percent"
+             symbol_name="NonSamplerShader00AccessStalledOnL3"
+             availability="$SubsliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="GPU/Data Port"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x000091BC" value="0xE0500000" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x104F0232" />
+        <register type="NOA" address="0x00009888" value="0x124F4640" />
+        <register type="NOA" address="0x00009888" value="0x106C0232" />
+        <register type="NOA" address="0x00009888" value="0x11834400" />
+        <register type="NOA" address="0x00009888" value="0x0A4E8000" />
+        <register type="NOA" address="0x00009888" value="0x0C4E8000" />
+        <register type="NOA" address="0x00009888" value="0x004F1880" />
+        <register type="NOA" address="0x00009888" value="0x024F08BB" />
+        <register type="NOA" address="0x00009888" value="0x044F001B" />
+        <register type="NOA" address="0x00009888" value="0x046C0100" />
+        <register type="NOA" address="0x00009888" value="0x066C000B" />
+        <register type="NOA" address="0x00009888" value="0x1A6C0000" />
+        <register type="NOA" address="0x00009888" value="0x041B8000" />
+        <register type="NOA" address="0x00009888" value="0x061B4000" />
+        <register type="NOA" address="0x00009888" value="0x1A1C1800" />
+        <register type="NOA" address="0x00009888" value="0x005B8000" />
+        <register type="NOA" address="0x00009888" value="0x025BC000" />
+        <register type="NOA" address="0x00009888" value="0x045B4000" />
+        <register type="NOA" address="0x00009888" value="0x125C8000" />
+        <register type="NOA" address="0x00009888" value="0x145C8000" />
+        <register type="NOA" address="0x00009888" value="0x165C8000" />
+        <register type="NOA" address="0x00009888" value="0x185C8000" />
+        <register type="NOA" address="0x00009888" value="0x0A4C00A0" />
+        <register type="NOA" address="0x00009888" value="0x000D8000" />
+        <register type="NOA" address="0x00009888" value="0x020DA000" />
+        <register type="NOA" address="0x00009888" value="0x040DA000" />
+        <register type="NOA" address="0x00009888" value="0x060D2000" />
+        <register type="NOA" address="0x00009888" value="0x0C0F5000" />
+        <register type="NOA" address="0x00009888" value="0x0E0F0055" />
+        <register type="NOA" address="0x00009888" value="0x022CC000" />
+        <register type="NOA" address="0x00009888" value="0x042CC000" />
+        <register type="NOA" address="0x00009888" value="0x062CC000" />
+        <register type="NOA" address="0x00009888" value="0x082CC000" />
+        <register type="NOA" address="0x00009888" value="0x0A2C8000" />
+        <register type="NOA" address="0x00009888" value="0x0C2C8000" />
+        <register type="NOA" address="0x00009888" value="0x0F828000" />
+        <register type="NOA" address="0x00009888" value="0x0F8305C0" />
+        <register type="NOA" address="0x00009888" value="0x09830000" />
+        <register type="NOA" address="0x00009888" value="0x07830000" />
+        <register type="NOA" address="0x00009888" value="0x1D950080" />
+        <register type="NOA" address="0x00009888" value="0x13928000" />
+        <register type="NOA" address="0x00009888" value="0x0F988000" />
+        <register type="NOA" address="0x00009888" value="0x31904000" />
+        <register type="NOA" address="0x00009888" value="0x1190FC00" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x59900000" />
+        <register type="NOA" address="0x00009888" value="0x4B900040" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x41900800" />
+        <register type="NOA" address="0x00009888" value="0x43900842" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+        <register type="NOA" address="0x00009888" value="0x45900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002744" value="0x00800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x10800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+        <register type="OA" address="0x00002770" value="0x00000002" />
+        <register type="OA" address="0x00002774" value="0x0000FDFF" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E758" value="0x00015014" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+        <register type="FLEX" address="0x0000E65C" value="0x00055054" />
+    </register_config>
+  </set>
+
+  <set name="Metric set L3_1"
+       mdapi_supported_apis="VK OGL OCL IO BB"
+       underscore_name="l3_1"
+       hw_config_guid="f889f8cc-4c93-4ac8-b75f-551c0b9b87f7"
+       chipset="KBLGT2"
+       symbol_name="L3_1"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 L3 Bank1 Active"
+             description="The percentage of time in which slice0 L3 bank1 is active"
+             data_type="float"
+             max_equation="100"
+             equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l30_bank1_active"
+             units="percent"
+             symbol_name="L30Bank1Active"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SQ is full"
+             description="The percentage of time when SQ is filled above a threshold (usually 48 entries)"
+             data_type="float"
+             max_equation="100"
+             equation="PERFCNT1 READ_REG 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gt_request_queue_full"
+             units="percent"
+             symbol_name="GTRequestQueueFull"
+             availability="true $QueryMode &&"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL4 OCL"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on the both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="Slice0 L3 Bank1 Stalled"
+             description="The percentage of time in which slice0 L3 bank1 is stalled"
+             data_type="float"
+             max_equation="100"
+             equation="B 4 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l30_bank1_stalled"
+             units="percent"
+             symbol_name="L30Bank1Stalled"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texel lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 L3 Bank0 Active"
+             description="The percentage of time in which slice0 L3 bank0 is active"
+             data_type="float"
+             max_equation="100"
+             equation="C 6 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l30_bank0_active"
+             units="percent"
+             symbol_name="L30Bank0Active"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 L3 Bank0 Stalled"
+             description="The percentage of time in which slice0 L3 bank0 is stalled"
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l30_bank0_stalled"
+             units="percent"
+             symbol_name="L30Bank0Stalled"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x000091BC" value="0xE0500000" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x126C7B40" />
+        <register type="NOA" address="0x00009888" value="0x166C0020" />
+        <register type="NOA" address="0x00009888" value="0x0A603444" />
+        <register type="NOA" address="0x00009888" value="0x0A613400" />
+        <register type="NOA" address="0x00009888" value="0x1A4EA800" />
+        <register type="NOA" address="0x00009888" value="0x1C4E0002" />
+        <register type="NOA" address="0x00009888" value="0x024E8000" />
+        <register type="NOA" address="0x00009888" value="0x044E8000" />
+        <register type="NOA" address="0x00009888" value="0x064E8000" />
+        <register type="NOA" address="0x00009888" value="0x084E8000" />
+        <register type="NOA" address="0x00009888" value="0x0A4E8000" />
+        <register type="NOA" address="0x00009888" value="0x064F4000" />
+        <register type="NOA" address="0x00009888" value="0x0C6C5327" />
+        <register type="NOA" address="0x00009888" value="0x0E6C5425" />
+        <register type="NOA" address="0x00009888" value="0x006C2A00" />
+        <register type="NOA" address="0x00009888" value="0x026C285B" />
+        <register type="NOA" address="0x00009888" value="0x046C005C" />
+        <register type="NOA" address="0x00009888" value="0x106C0000" />
+        <register type="NOA" address="0x00009888" value="0x1C6C0000" />
+        <register type="NOA" address="0x00009888" value="0x1E6C0000" />
+        <register type="NOA" address="0x00009888" value="0x1A6C0800" />
+        <register type="NOA" address="0x00009888" value="0x0C1BC000" />
+        <register type="NOA" address="0x00009888" value="0x0E1BC000" />
+        <register type="NOA" address="0x00009888" value="0x001B8000" />
+        <register type="NOA" address="0x00009888" value="0x021BC000" />
+        <register type="NOA" address="0x00009888" value="0x041BC000" />
+        <register type="NOA" address="0x00009888" value="0x1C1C003C" />
+        <register type="NOA" address="0x00009888" value="0x121C8000" />
+        <register type="NOA" address="0x00009888" value="0x141C8000" />
+        <register type="NOA" address="0x00009888" value="0x161C8000" />
+        <register type="NOA" address="0x00009888" value="0x181C8000" />
+        <register type="NOA" address="0x00009888" value="0x1A1C0800" />
+        <register type="NOA" address="0x00009888" value="0x065B4000" />
+        <register type="NOA" address="0x00009888" value="0x1A5C1000" />
+        <register type="NOA" address="0x00009888" value="0x10600000" />
+        <register type="NOA" address="0x00009888" value="0x04600000" />
+        <register type="NOA" address="0x00009888" value="0x0C610044" />
+        <register type="NOA" address="0x00009888" value="0x10610000" />
+        <register type="NOA" address="0x00009888" value="0x06610000" />
+        <register type="NOA" address="0x00009888" value="0x0C4C02A8" />
+        <register type="NOA" address="0x00009888" value="0x084CA000" />
+        <register type="NOA" address="0x00009888" value="0x0A4C002A" />
+        <register type="NOA" address="0x00009888" value="0x0C0DA000" />
+        <register type="NOA" address="0x00009888" value="0x0E0DA000" />
+        <register type="NOA" address="0x00009888" value="0x000D8000" />
+        <register type="NOA" address="0x00009888" value="0x020DA000" />
+        <register type="NOA" address="0x00009888" value="0x040DA000" />
+        <register type="NOA" address="0x00009888" value="0x060D2000" />
+        <register type="NOA" address="0x00009888" value="0x100F0154" />
+        <register type="NOA" address="0x00009888" value="0x0C0F5000" />
+        <register type="NOA" address="0x00009888" value="0x0E0F0055" />
+        <register type="NOA" address="0x00009888" value="0x182C00AA" />
+        <register type="NOA" address="0x00009888" value="0x022C8000" />
+        <register type="NOA" address="0x00009888" value="0x042C8000" />
+        <register type="NOA" address="0x00009888" value="0x062C8000" />
+        <register type="NOA" address="0x00009888" value="0x082C8000" />
+        <register type="NOA" address="0x00009888" value="0x0A2C8000" />
+        <register type="NOA" address="0x00009888" value="0x0C2CC000" />
+        <register type="NOA" address="0x00009888" value="0x1190FFC0" />
+        <register type="NOA" address="0x00009888" value="0x57900000" />
+        <register type="NOA" address="0x00009888" value="0x49900420" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+        <register type="NOA" address="0x00009888" value="0x4B900021" />
+        <register type="NOA" address="0x00009888" value="0x59900000" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x41900400" />
+        <register type="NOA" address="0x00009888" value="0x43900421" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+        <register type="NOA" address="0x00009888" value="0x45900040" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002744" value="0x00800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0xF0800000" />
+        <register type="OA" address="0x00002770" value="0x00100070" />
+        <register type="OA" address="0x00002774" value="0x0000FFF1" />
+        <register type="OA" address="0x00002778" value="0x00014002" />
+        <register type="OA" address="0x0000277C" value="0x0000C3FF" />
+        <register type="OA" address="0x00002780" value="0x00010002" />
+        <register type="OA" address="0x00002784" value="0x0000C7FF" />
+        <register type="OA" address="0x00002788" value="0x00004002" />
+        <register type="OA" address="0x0000278C" value="0x0000D3FF" />
+        <register type="OA" address="0x00002790" value="0x00100700" />
+        <register type="OA" address="0x00002794" value="0x0000FF1F" />
+        <register type="OA" address="0x00002798" value="0x00001402" />
+        <register type="OA" address="0x0000279C" value="0x0000FC3F" />
+        <register type="OA" address="0x000027A0" value="0x00001002" />
+        <register type="OA" address="0x000027A4" value="0x0000FC7F" />
+        <register type="OA" address="0x000027A8" value="0x00000402" />
+        <register type="OA" address="0x000027AC" value="0x0000FD3F" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E758" value="0x00015014" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+        <register type="FLEX" address="0x0000E65C" value="0x00055054" />
+    </register_config>
+  </set>
+
+  <set name="Metric set L3_2"
+       mdapi_supported_apis="VK OGL OCL IO BB"
+       underscore_name="l3_2"
+       hw_config_guid="6d344efd-8e9e-42d4-a29e-1011c29f82c2"
+       chipset="KBLGT2"
+       symbol_name="L3_2"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SQ is full"
+             description="The percentage of time when SQ is filled above a threshold (usually 48 entries)"
+             data_type="float"
+             max_equation="100"
+             equation="PERFCNT1 READ_REG 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gt_request_queue_full"
+             units="percent"
+             symbol_name="GTRequestQueueFull"
+             availability="true $QueryMode &&"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL4 OCL"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on the both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 L3 Bank2 Stalled"
+             description="The percentage of time in which slice0 L3 bank2 is stalled"
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l30_bank2_stalled"
+             units="percent"
+             symbol_name="L30Bank2Stalled"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 L3 Bank2 Active"
+             description="The percentage of time in which slice0 L3 bank2 is active"
+             data_type="float"
+             max_equation="100"
+             equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l30_bank2_active"
+             units="percent"
+             symbol_name="L30Bank2Active"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x000091BC" value="0xE0500000" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x126C02E0" />
+        <register type="NOA" address="0x00009888" value="0x146C0001" />
+        <register type="NOA" address="0x00009888" value="0x0A623400" />
+        <register type="NOA" address="0x00009888" value="0x044E8000" />
+        <register type="NOA" address="0x00009888" value="0x064E8000" />
+        <register type="NOA" address="0x00009888" value="0x084E8000" />
+        <register type="NOA" address="0x00009888" value="0x0A4E8000" />
+        <register type="NOA" address="0x00009888" value="0x064F4000" />
+        <register type="NOA" address="0x00009888" value="0x026C3324" />
+        <register type="NOA" address="0x00009888" value="0x046C3422" />
+        <register type="NOA" address="0x00009888" value="0x106C0000" />
+        <register type="NOA" address="0x00009888" value="0x1A6C0000" />
+        <register type="NOA" address="0x00009888" value="0x021BC000" />
+        <register type="NOA" address="0x00009888" value="0x041BC000" />
+        <register type="NOA" address="0x00009888" value="0x141C8000" />
+        <register type="NOA" address="0x00009888" value="0x161C8000" />
+        <register type="NOA" address="0x00009888" value="0x181C8000" />
+        <register type="NOA" address="0x00009888" value="0x1A1C0800" />
+        <register type="NOA" address="0x00009888" value="0x065B4000" />
+        <register type="NOA" address="0x00009888" value="0x1A5C1000" />
+        <register type="NOA" address="0x00009888" value="0x06614000" />
+        <register type="NOA" address="0x00009888" value="0x0C620044" />
+        <register type="NOA" address="0x00009888" value="0x10620000" />
+        <register type="NOA" address="0x00009888" value="0x06620000" />
+        <register type="NOA" address="0x00009888" value="0x084C8000" />
+        <register type="NOA" address="0x00009888" value="0x0A4C002A" />
+        <register type="NOA" address="0x00009888" value="0x020DA000" />
+        <register type="NOA" address="0x00009888" value="0x040DA000" />
+        <register type="NOA" address="0x00009888" value="0x060D2000" />
+        <register type="NOA" address="0x00009888" value="0x0C0F4000" />
+        <register type="NOA" address="0x00009888" value="0x0E0F0055" />
+        <register type="NOA" address="0x00009888" value="0x042C8000" />
+        <register type="NOA" address="0x00009888" value="0x062C8000" />
+        <register type="NOA" address="0x00009888" value="0x082C8000" />
+        <register type="NOA" address="0x00009888" value="0x0A2C8000" />
+        <register type="NOA" address="0x00009888" value="0x0C2CC000" />
+        <register type="NOA" address="0x00009888" value="0x1190F800" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x43900000" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+        <register type="NOA" address="0x00009888" value="0x45900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002744" value="0x00800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+        <register type="OA" address="0x00002770" value="0x00100070" />
+        <register type="OA" address="0x00002774" value="0x0000FFF1" />
+        <register type="OA" address="0x00002778" value="0x00028002" />
+        <register type="OA" address="0x0000277C" value="0x000087FF" />
+        <register type="OA" address="0x00002780" value="0x00020002" />
+        <register type="OA" address="0x00002784" value="0x00008FFF" />
+        <register type="OA" address="0x00002788" value="0x00008002" />
+        <register type="OA" address="0x0000278C" value="0x0000A7FF" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E758" value="0x00015014" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+        <register type="FLEX" address="0x0000E65C" value="0x00055054" />
+    </register_config>
+  </set>
+
+  <set name="Metric set L3_3"
+       mdapi_supported_apis="VK OGL OCL IO BB"
+       underscore_name="l3_3"
+       hw_config_guid="e3b386ae-c195-47d5-af29-8a1afa0ae2bf"
+       chipset="KBLGT2"
+       symbol_name="L3_3"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SQ is full"
+             description="The percentage of time when SQ is filled above a threshold (usually 48 entries)"
+             data_type="float"
+             max_equation="100"
+             equation="PERFCNT1 READ_REG 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gt_request_queue_full"
+             units="percent"
+             symbol_name="GTRequestQueueFull"
+             availability="true $QueryMode &&"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL4 OCL"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on the both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Slice0 L3 Bank3 Stalled"
+             description="The percentage of time in which slice0 L3 bank3 is stalled"
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l30_bank3_stalled"
+             units="percent"
+             symbol_name="L30Bank3Stalled"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 L3 Bank3 Active"
+             description="The percentage of time in which slice0 L3 bank3 is active"
+             data_type="float"
+             max_equation="100"
+             equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l30_bank3_active"
+             units="percent"
+             symbol_name="L30Bank3Active"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x000091BC" value="0xE0500000" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x126C4E80" />
+        <register type="NOA" address="0x00009888" value="0x146C0000" />
+        <register type="NOA" address="0x00009888" value="0x0A633400" />
+        <register type="NOA" address="0x00009888" value="0x044E8000" />
+        <register type="NOA" address="0x00009888" value="0x064E8000" />
+        <register type="NOA" address="0x00009888" value="0x084E8000" />
+        <register type="NOA" address="0x00009888" value="0x0A4E8000" />
+        <register type="NOA" address="0x00009888" value="0x0C4E8000" />
+        <register type="NOA" address="0x00009888" value="0x026C3321" />
+        <register type="NOA" address="0x00009888" value="0x046C342F" />
+        <register type="NOA" address="0x00009888" value="0x106C0000" />
+        <register type="NOA" address="0x00009888" value="0x1A6C2000" />
+        <register type="NOA" address="0x00009888" value="0x021BC000" />
+        <register type="NOA" address="0x00009888" value="0x041BC000" />
+        <register type="NOA" address="0x00009888" value="0x061B4000" />
+        <register type="NOA" address="0x00009888" value="0x141C8000" />
+        <register type="NOA" address="0x00009888" value="0x161C8000" />
+        <register type="NOA" address="0x00009888" value="0x181C8000" />
+        <register type="NOA" address="0x00009888" value="0x1A1C1800" />
+        <register type="NOA" address="0x00009888" value="0x06604000" />
+        <register type="NOA" address="0x00009888" value="0x0C630044" />
+        <register type="NOA" address="0x00009888" value="0x10630000" />
+        <register type="NOA" address="0x00009888" value="0x06630000" />
+        <register type="NOA" address="0x00009888" value="0x084C8000" />
+        <register type="NOA" address="0x00009888" value="0x0A4C00AA" />
+        <register type="NOA" address="0x00009888" value="0x020DA000" />
+        <register type="NOA" address="0x00009888" value="0x040DA000" />
+        <register type="NOA" address="0x00009888" value="0x060D2000" />
+        <register type="NOA" address="0x00009888" value="0x0C0F4000" />
+        <register type="NOA" address="0x00009888" value="0x0E0F0055" />
+        <register type="NOA" address="0x00009888" value="0x042C8000" />
+        <register type="NOA" address="0x00009888" value="0x062C8000" />
+        <register type="NOA" address="0x00009888" value="0x082C8000" />
+        <register type="NOA" address="0x00009888" value="0x0A2C8000" />
+        <register type="NOA" address="0x00009888" value="0x0C2C8000" />
+        <register type="NOA" address="0x00009888" value="0x1190F800" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x43900842" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+        <register type="NOA" address="0x00009888" value="0x45900002" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002744" value="0x00800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+        <register type="OA" address="0x00002770" value="0x00100070" />
+        <register type="OA" address="0x00002774" value="0x0000FFF1" />
+        <register type="OA" address="0x00002778" value="0x00028002" />
+        <register type="OA" address="0x0000277C" value="0x000087FF" />
+        <register type="OA" address="0x00002780" value="0x00020002" />
+        <register type="OA" address="0x00002784" value="0x00008FFF" />
+        <register type="OA" address="0x00002788" value="0x00008002" />
+        <register type="OA" address="0x0000278C" value="0x0000A7FF" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E758" value="0x00015014" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+        <register type="FLEX" address="0x0000E65C" value="0x00055054" />
+    </register_config>
+  </set>
+
+  <set name="Metric set RasterizerAndPixelBackend"
+       mdapi_supported_apis="VK OGL OCL IO BB"
+       underscore_name="rasterizer_and_pixel_backend"
+       hw_config_guid="f9954679-a055-4862-9f57-9d66e3ebf81c"
+       chipset="KBLGT2"
+       symbol_name="RasterizerAndPixelBackend"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SQ is full"
+             description="The percentage of time when SQ is filled above a threshold (usually 48 entries)"
+             data_type="float"
+             max_equation="100"
+             equation="PERFCNT1 READ_REG 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gt_request_queue_full"
+             units="percent"
+             symbol_name="GTRequestQueueFull"
+             availability="true $QueryMode &&"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL4 OCL"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on the both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Slice0 Pixel Values Ready"
+             description="The percentage of time in which slice0 pixel values are ready"
+             data_type="float"
+             max_equation="100"
+             equation="C 6 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="pixel_values0_ready"
+             units="percent"
+             symbol_name="PixelValues0Ready"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/3D Pipe"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="Slice0 Rasterizer Input Available"
+             description="The percentage of time in which slice0 rasterizer input is available"
+             data_type="float"
+             max_equation="100"
+             equation="B 1 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="rasterizer0_input_available"
+             units="percent"
+             symbol_name="Rasterizer0InputAvailable"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Rasterizer"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Slice0 Post-EarlyZ Pixel Data Ready"
+             description="The percentage of time in which slice0 post-EarlyZ pixel data is ready (after early Z tests have been applied)"
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="pixel_data0_ready"
+             units="percent"
+             symbol_name="PixelData0Ready"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Rasterizer/Early Depth Test"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 Rasterizer Output Ready"
+             description="The percentage of time in which slice0 rasterizer output is ready"
+             data_type="float"
+             max_equation="100"
+             equation="C 5 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="rasterizer0_output_ready"
+             units="percent"
+             symbol_name="Rasterizer0OutputReady"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Rasterizer"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="Slice0 PS Output Available"
+             description="The percentage of time in which slice0 PS output is available"
+             data_type="float"
+             max_equation="100"
+             equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_output0_available"
+             units="percent"
+             symbol_name="PSOutput0Available"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/3D Pipe"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x000091BC" value="0xE0500000" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x102F3800" />
+        <register type="NOA" address="0x00009888" value="0x144D0500" />
+        <register type="NOA" address="0x00009888" value="0x120D03C0" />
+        <register type="NOA" address="0x00009888" value="0x140D03CF" />
+        <register type="NOA" address="0x00009888" value="0x0C0F0004" />
+        <register type="NOA" address="0x00009888" value="0x0C4E4000" />
+        <register type="NOA" address="0x00009888" value="0x042F0480" />
+        <register type="NOA" address="0x00009888" value="0x082F0000" />
+        <register type="NOA" address="0x00009888" value="0x022F0000" />
+        <register type="NOA" address="0x00009888" value="0x0A4C0090" />
+        <register type="NOA" address="0x00009888" value="0x064D0027" />
+        <register type="NOA" address="0x00009888" value="0x004D0000" />
+        <register type="NOA" address="0x00009888" value="0x000D0D40" />
+        <register type="NOA" address="0x00009888" value="0x020D803F" />
+        <register type="NOA" address="0x00009888" value="0x040D8023" />
+        <register type="NOA" address="0x00009888" value="0x100D0000" />
+        <register type="NOA" address="0x00009888" value="0x060D2000" />
+        <register type="NOA" address="0x00009888" value="0x020F0010" />
+        <register type="NOA" address="0x00009888" value="0x000F0000" />
+        <register type="NOA" address="0x00009888" value="0x0E0F0050" />
+        <register type="NOA" address="0x00009888" value="0x0A2C8000" />
+        <register type="NOA" address="0x00009888" value="0x0C2C8000" />
+        <register type="NOA" address="0x00009888" value="0x1190FC00" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x41901400" />
+        <register type="NOA" address="0x00009888" value="0x43901485" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+        <register type="NOA" address="0x00009888" value="0x45900001" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002744" value="0x00800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x30800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+        <register type="OA" address="0x00002770" value="0x00000002" />
+        <register type="OA" address="0x00002774" value="0x0000EFFF" />
+        <register type="OA" address="0x00002778" value="0x00006000" />
+        <register type="OA" address="0x0000277C" value="0x0000F3FF" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E758" value="0x00015014" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+        <register type="FLEX" address="0x0000E65C" value="0x00055054" />
+    </register_config>
+  </set>
+
+  <set name="Metric set Sampler"
+       mdapi_supported_apis="VK OGL OCL IO BB"
+       underscore_name="sampler"
+       hw_config_guid="4ed5e27e-fd1a-4f11-ad8f-9374e128c697"
+       chipset="KBLGT2"
+       symbol_name="Sampler"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 Subslice2 Input Available"
+             description="The percentage of time in which slice0 subslice2 sampler input is available"
+             data_type="float"
+             max_equation="100"
+             equation="B 1 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler02_input_available"
+             units="percent"
+             symbol_name="Sampler02InputAvailable"
+             availability="$SubsliceMask 0x4 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SQ is full"
+             description="The percentage of time when SQ is filled above a threshold (usually 48 entries)"
+             data_type="float"
+             max_equation="100"
+             equation="PERFCNT1 READ_REG 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gt_request_queue_full"
+             units="percent"
+             symbol_name="GTRequestQueueFull"
+             availability="true $QueryMode &&"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL4 OCL"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 Subslice0 Input Available"
+             description="The percentage of time in which slice0 subslice0 sampler input is available"
+             data_type="float"
+             max_equation="100"
+             equation="B 2 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler00_input_available"
+             units="percent"
+             symbol_name="Sampler00InputAvailable"
+             availability="$SubsliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on the both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="Slice0 Subslice2 Sampler Output Ready"
+             description="The percentage of time in which slice0 subslice2 sampler output is ready"
+             data_type="float"
+             max_equation="100"
+             equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler02_output_ready"
+             units="percent"
+             symbol_name="Sampler02OutputReady"
+             availability="$SubsliceMask 0x4 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Slice0 Subslice1 Input Available"
+             description="The percentage of time in which slice0 subslice1 sampler input is available"
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler01_input_available"
+             units="percent"
+             symbol_name="Sampler01InputAvailable"
+             availability="$SubsliceMask 0x2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Slice0 Subslice0 Sampler Output Ready"
+             description="The percentage of time in which slice0 subslice0 sampler output is ready"
+             data_type="float"
+             max_equation="100"
+             equation="C 6 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler00_output_ready"
+             units="percent"
+             symbol_name="Sampler00OutputReady"
+             availability="$SubsliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Slice0 Subslice1 Sampler Output Ready"
+             description="The percentage of time in which slice0 subslice1 sampler output is ready"
+             data_type="float"
+             max_equation="100"
+             equation="C 5 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler01_output_ready"
+             units="percent"
+             symbol_name="Sampler01OutputReady"
+             availability="$SubsliceMask 0x2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x000091BC" value="0xE0500000" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x14152C00" />
+        <register type="NOA" address="0x00009888" value="0x16150005" />
+        <register type="NOA" address="0x00009888" value="0x121600A0" />
+        <register type="NOA" address="0x00009888" value="0x14352C00" />
+        <register type="NOA" address="0x00009888" value="0x16350005" />
+        <register type="NOA" address="0x00009888" value="0x123600A0" />
+        <register type="NOA" address="0x00009888" value="0x14552C00" />
+        <register type="NOA" address="0x00009888" value="0x16550005" />
+        <register type="NOA" address="0x00009888" value="0x125600A0" />
+        <register type="NOA" address="0x00009888" value="0x062F6000" />
+        <register type="NOA" address="0x00009888" value="0x022F2000" />
+        <register type="NOA" address="0x00009888" value="0x0C4C0050" />
+        <register type="NOA" address="0x00009888" value="0x0A4C0010" />
+        <register type="NOA" address="0x00009888" value="0x0C0D8000" />
+        <register type="NOA" address="0x00009888" value="0x0E0DA000" />
+        <register type="NOA" address="0x00009888" value="0x000D8000" />
+        <register type="NOA" address="0x00009888" value="0x020DA000" />
+        <register type="NOA" address="0x00009888" value="0x040DA000" />
+        <register type="NOA" address="0x00009888" value="0x060D2000" />
+        <register type="NOA" address="0x00009888" value="0x100F0350" />
+        <register type="NOA" address="0x00009888" value="0x0C0FB000" />
+        <register type="NOA" address="0x00009888" value="0x0E0F00DA" />
+        <register type="NOA" address="0x00009888" value="0x182C0028" />
+        <register type="NOA" address="0x00009888" value="0x0A2C8000" />
+        <register type="NOA" address="0x00009888" value="0x022DC000" />
+        <register type="NOA" address="0x00009888" value="0x042D4000" />
+        <register type="NOA" address="0x00009888" value="0x0C138000" />
+        <register type="NOA" address="0x00009888" value="0x0E132000" />
+        <register type="NOA" address="0x00009888" value="0x0413C000" />
+        <register type="NOA" address="0x00009888" value="0x1C140018" />
+        <register type="NOA" address="0x00009888" value="0x0C157000" />
+        <register type="NOA" address="0x00009888" value="0x0E150078" />
+        <register type="NOA" address="0x00009888" value="0x10150000" />
+        <register type="NOA" address="0x00009888" value="0x04162180" />
+        <register type="NOA" address="0x00009888" value="0x02160000" />
+        <register type="NOA" address="0x00009888" value="0x04174000" />
+        <register type="NOA" address="0x00009888" value="0x0233A000" />
+        <register type="NOA" address="0x00009888" value="0x04333000" />
+        <register type="NOA" address="0x00009888" value="0x14348000" />
+        <register type="NOA" address="0x00009888" value="0x16348000" />
+        <register type="NOA" address="0x00009888" value="0x02357870" />
+        <register type="NOA" address="0x00009888" value="0x10350000" />
+        <register type="NOA" address="0x00009888" value="0x04360043" />
+        <register type="NOA" address="0x00009888" value="0x02360000" />
+        <register type="NOA" address="0x00009888" value="0x04371000" />
+        <register type="NOA" address="0x00009888" value="0x0E538000" />
+        <register type="NOA" address="0x00009888" value="0x00538000" />
+        <register type="NOA" address="0x00009888" value="0x06533000" />
+        <register type="NOA" address="0x00009888" value="0x1C540020" />
+        <register type="NOA" address="0x00009888" value="0x12548000" />
+        <register type="NOA" address="0x00009888" value="0x0E557000" />
+        <register type="NOA" address="0x00009888" value="0x00557800" />
+        <register type="NOA" address="0x00009888" value="0x10550000" />
+        <register type="NOA" address="0x00009888" value="0x06560043" />
+        <register type="NOA" address="0x00009888" value="0x02560000" />
+        <register type="NOA" address="0x00009888" value="0x06571000" />
+        <register type="NOA" address="0x00009888" value="0x1190FF80" />
+        <register type="NOA" address="0x00009888" value="0x57900000" />
+        <register type="NOA" address="0x00009888" value="0x49900000" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+        <register type="NOA" address="0x00009888" value="0x4B900060" />
+        <register type="NOA" address="0x00009888" value="0x59900000" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x41900C00" />
+        <register type="NOA" address="0x00009888" value="0x43900842" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+        <register type="NOA" address="0x00009888" value="0x45900060" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002744" value="0x00800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x70800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+        <register type="OA" address="0x00002770" value="0x0000C000" />
+        <register type="OA" address="0x00002774" value="0x0000E7FF" />
+        <register type="OA" address="0x00002778" value="0x00003000" />
+        <register type="OA" address="0x0000277C" value="0x0000F9FF" />
+        <register type="OA" address="0x00002780" value="0x00000C00" />
+        <register type="OA" address="0x00002784" value="0x0000FE7F" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E758" value="0x00015014" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+        <register type="FLEX" address="0x0000E65C" value="0x00055054" />
+    </register_config>
+  </set>
+
+  <set name="Metric set TDL_1"
+       mdapi_supported_apis="VK OGL OCL IO BB"
+       underscore_name="tdl_1"
+       hw_config_guid="9eaf384d-8f53-41b8-a71d-108308780fbc"
+       chipset="KBLGT2"
+       symbol_name="TDL_1"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SQ is full"
+             description="The percentage of time when SQ is filled above a threshold (usually 48 entries)"
+             data_type="float"
+             max_equation="100"
+             equation="PERFCNT1 READ_REG 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gt_request_queue_full"
+             units="percent"
+             symbol_name="GTRequestQueueFull"
+             availability="true $QueryMode &amp;&amp;"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL4 OCL"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="NonPS Thread Ready For Dispatch on Slice0 Subslice2"
+             description="The percentage of time in which non-PS thread is ready for dispatch on slice0 subslice2 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="B 4 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="non_ps_thread02_ready_for_dispatch"
+             units="percent"
+             symbol_name="NonPSThread02ReadyForDispatch"
+             availability="$SubsliceMask 0x4 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texel lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="NonPS Thread Ready For Dispatch on Slice0 Subslice0"
+             description="The percentage of time in which non-PS thread is ready for dispatch on slice0 subslice0 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="B 2 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="non_ps_thread00_ready_for_dispatch"
+             units="percent"
+             symbol_name="NonPSThread00ReadyForDispatch"
+             availability="$SubsliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Thread Ready For Dispatch on Slice0 Subslice0"
+             description="The percentage of time in which PS thread is ready for dispatch on slice0 subslice0 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="B 1 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_thread00_ready_for_dispatch"
+             units="percent"
+             symbol_name="PSThread00ReadyForDispatch"
+             availability="$SubsliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="PS Thread Ready For Dispatch on Slice0 Subslice1"
+             description="The percentage of time in which PS thread is ready for dispatch on slice0 subslice1 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="B 5 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_thread01_ready_for_dispatch"
+             units="percent"
+             symbol_name="PSThread01ReadyForDispatch"
+             availability="$SubsliceMask 0x2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="PS Thread Ready For Dispatch on Slice0 Subslice2"
+             description="The percentage of time in which PS thread is ready for dispatch on slice0 subslice2 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="B 3 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_thread02_ready_for_dispatch"
+             units="percent"
+             symbol_name="PSThread02ReadyForDispatch"
+             availability="$SubsliceMask 0x4 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <counter name="NonPS Thread Ready For Dispatch on Slice0 Subslice1"
+             description="The percentage of time in which non-PS thread is ready for dispatch on slice0 subslice1 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="non_ps_thread01_ready_for_dispatch"
+             units="percent"
+             symbol_name="NonPSThread01ReadyForDispatch"
+             availability="$SubsliceMask 0x2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x000091BC" value="0xE0500000" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x12120000" />
+        <register type="NOA" address="0x00009888" value="0x12320000" />
+        <register type="NOA" address="0x00009888" value="0x12520000" />
+        <register type="NOA" address="0x00009888" value="0x002F8000" />
+        <register type="NOA" address="0x00009888" value="0x022F3000" />
+        <register type="NOA" address="0x00009888" value="0x0A4C0015" />
+        <register type="NOA" address="0x00009888" value="0x0C0D8000" />
+        <register type="NOA" address="0x00009888" value="0x0E0DA000" />
+        <register type="NOA" address="0x00009888" value="0x000D8000" />
+        <register type="NOA" address="0x00009888" value="0x020DA000" />
+        <register type="NOA" address="0x00009888" value="0x040DA000" />
+        <register type="NOA" address="0x00009888" value="0x060D2000" />
+        <register type="NOA" address="0x00009888" value="0x100F03A0" />
+        <register type="NOA" address="0x00009888" value="0x0C0FF000" />
+        <register type="NOA" address="0x00009888" value="0x0E0F0095" />
+        <register type="NOA" address="0x00009888" value="0x062C8000" />
+        <register type="NOA" address="0x00009888" value="0x082C8000" />
+        <register type="NOA" address="0x00009888" value="0x0A2C8000" />
+        <register type="NOA" address="0x00009888" value="0x0C2D8000" />
+        <register type="NOA" address="0x00009888" value="0x0E2D4000" />
+        <register type="NOA" address="0x00009888" value="0x062D4000" />
+        <register type="NOA" address="0x00009888" value="0x02108000" />
+        <register type="NOA" address="0x00009888" value="0x0410C000" />
+        <register type="NOA" address="0x00009888" value="0x02118000" />
+        <register type="NOA" address="0x00009888" value="0x0411C000" />
+        <register type="NOA" address="0x00009888" value="0x02121880" />
+        <register type="NOA" address="0x00009888" value="0x041219B5" />
+        <register type="NOA" address="0x00009888" value="0x00120000" />
+        <register type="NOA" address="0x00009888" value="0x02134000" />
+        <register type="NOA" address="0x00009888" value="0x04135000" />
+        <register type="NOA" address="0x00009888" value="0x0C308000" />
+        <register type="NOA" address="0x00009888" value="0x0E304000" />
+        <register type="NOA" address="0x00009888" value="0x06304000" />
+        <register type="NOA" address="0x00009888" value="0x0C318000" />
+        <register type="NOA" address="0x00009888" value="0x0E314000" />
+        <register type="NOA" address="0x00009888" value="0x06314000" />
+        <register type="NOA" address="0x00009888" value="0x0C321A80" />
+        <register type="NOA" address="0x00009888" value="0x0E320033" />
+        <register type="NOA" address="0x00009888" value="0x06320031" />
+        <register type="NOA" address="0x00009888" value="0x00320000" />
+        <register type="NOA" address="0x00009888" value="0x0C334000" />
+        <register type="NOA" address="0x00009888" value="0x0E331000" />
+        <register type="NOA" address="0x00009888" value="0x06331000" />
+        <register type="NOA" address="0x00009888" value="0x0E508000" />
+        <register type="NOA" address="0x00009888" value="0x00508000" />
+        <register type="NOA" address="0x00009888" value="0x02504000" />
+        <register type="NOA" address="0x00009888" value="0x0E518000" />
+        <register type="NOA" address="0x00009888" value="0x00518000" />
+        <register type="NOA" address="0x00009888" value="0x02514000" />
+        <register type="NOA" address="0x00009888" value="0x0E521880" />
+        <register type="NOA" address="0x00009888" value="0x00521A80" />
+        <register type="NOA" address="0x00009888" value="0x02520033" />
+        <register type="NOA" address="0x00009888" value="0x0E534000" />
+        <register type="NOA" address="0x00009888" value="0x00534000" />
+        <register type="NOA" address="0x00009888" value="0x02531000" />
+        <register type="NOA" address="0x00009888" value="0x1190FF80" />
+        <register type="NOA" address="0x00009888" value="0x57900000" />
+        <register type="NOA" address="0x00009888" value="0x49900800" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+        <register type="NOA" address="0x00009888" value="0x4B900062" />
+        <register type="NOA" address="0x00009888" value="0x59900000" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x41900C00" />
+        <register type="NOA" address="0x00009888" value="0x43900003" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+        <register type="NOA" address="0x00009888" value="0x45900040" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002744" value="0x00800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x30800000" />
+        <register type="OA" address="0x00002770" value="0x00000002" />
+        <register type="OA" address="0x00002774" value="0x00007FFF" />
+        <register type="OA" address="0x00002778" value="0x00000000" />
+        <register type="OA" address="0x0000277C" value="0x00009FFF" />
+        <register type="OA" address="0x00002780" value="0x00000002" />
+        <register type="OA" address="0x00002784" value="0x0000EFFF" />
+        <register type="OA" address="0x00002788" value="0x00000000" />
+        <register type="OA" address="0x0000278C" value="0x0000F3FF" />
+        <register type="OA" address="0x00002790" value="0x00000002" />
+        <register type="OA" address="0x00002794" value="0x0000FDFF" />
+        <register type="OA" address="0x00002798" value="0x00000000" />
+        <register type="OA" address="0x0000279C" value="0x0000FE7F" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E758" value="0x00015014" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+        <register type="FLEX" address="0x0000E65C" value="0x00055054" />
+    </register_config>
+  </set>
+
+  <set name="Metric set TDL_2"
+       mdapi_supported_apis="VK OGL OCL IO BB"
+       underscore_name="tdl_2"
+       hw_config_guid="a00cbdf2-eabd-4240-9a89-86e2ac1ca1e4"
+       chipset="KBLGT2"
+       symbol_name="TDL_2"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SQ is full"
+             description="The percentage of time when SQ is filled above a threshold (usually 48 entries)"
+             data_type="float"
+             max_equation="100"
+             equation="PERFCNT1 READ_REG 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gt_request_queue_full"
+             units="percent"
+             symbol_name="GTRequestQueueFull"
+             availability="true $QueryMode &&"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL4 OCL"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on the both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Thread Header Ready on Slice0 Subslice1 Port 0"
+             description="The percentage of time in which thread header is ready on slice0 subslice1 thread dispatcher port 0"
+             data_type="float"
+             max_equation="100"
+             equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header01_ready_port0"
+             units="percent"
+             symbol_name="ThreadHeader01ReadyPort0"
+             availability="$SubsliceMask 0x2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Thread Header Ready on Slice0 Subslice1 Port 1"
+             description="The percentage of time in which thread header is ready on slice0 subslice1 thread dispatcher port 1"
+             data_type="float"
+             max_equation="100"
+             equation="C 2 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header01_ready_port1"
+             units="percent"
+             symbol_name="ThreadHeader01ReadyPort1"
+             availability="$SubsliceMask 0x2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Thread Header Ready on Slice0 Subslice2 Port 1"
+             description="The percentage of time in which thread header is ready on slice0 subslice2 thread dispatcher port 1"
+             data_type="float"
+             max_equation="100"
+             equation="C 4 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header02_ready_port1"
+             units="percent"
+             symbol_name="ThreadHeader02ReadyPort1"
+             availability="$SubsliceMask 0x4 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Thread Header Ready on Slice0 Subslice2 Port 0"
+             description="The percentage of time in which thread header is ready on slice0 subslice2 thread dispatcher port 0"
+             data_type="float"
+             max_equation="100"
+             equation="C 3 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header02_ready_port0"
+             units="percent"
+             symbol_name="ThreadHeader02ReadyPort0"
+             availability="$SubsliceMask 0x4 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             /> <!-- EuStall: float percent with max_equation 100. Read as RPN (presumably): ((A8 / $EuCoresTotalCount) * 100) / $GpuCoreClocks; depends on the set's GpuCoreClocks counter. -->
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             /> <!-- SamplesBlended: "A 27 READ" followed by "4 UMUL"; presumably RPN for A27 * 4. TODO confirm. -->
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             /> <!-- EarlyDepthTestFails: "A 23 READ" followed by "4 UMUL"; presumably RPN for A23 * 4. TODO confirm. -->
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             /> <!-- ShaderMemoryAccesses: unscaled read "A 32 READ"; the L3ShaderThroughput equation in this set refers to it as $ShaderMemoryAccesses. -->
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             /> <!-- HsThreads: unscaled uint64 event count; the equation is the single read "A 2 READ". -->
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             /> <!-- SlmBytesWritten: read as RPN (presumably) the value is A31 * 64 and the maximum is $GpuCoreClocks * 64 * $EuSubslicesTotalCount; units are bytes. -->
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             /> <!-- L3ShaderThroughput: read as RPN (presumably) this is A30 + (A31 + ($ShaderMemoryAccesses * 64)). NOTE(review): only $ShaderMemoryAccesses is scaled by 64 here, while SlmBytesWritten in this set scales A 31 by 64; confirm the intended grouping with the data source before relying on the byte units. -->
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             /> <!-- SamplesKilledInPs: "A 24 READ" followed by "4 UMUL" (presumably A24 * 4). NOTE(review): the display name and group say FS / Fragment Shader while underscore_name and symbol_name say ps / Ps; the identifiers are presumably kept for compatibility, confirm before renaming either. -->
+    <counter name="Thread Header Ready on Slice0 Subslice0 Port 0"
+             description="The percentage of time in which thread header is ready on slice0 subslice0 thread dispatcher port 0"
+             data_type="float"
+             max_equation="100"
+             equation="C 5 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header00_ready_port0"
+             units="percent"
+             symbol_name="ThreadHeader00ReadyPort0"
+             availability="$SubsliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             /> <!-- ThreadHeader00ReadyPort0: read as RPN (presumably) (C5 * 100) / $GpuCoreClocks. The availability expression ANDs $SubsliceMask with 0x1; presumably the counter is only exposed when that bit is set, TODO confirm. -->
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             /> <!-- ShaderAtomics: unscaled uint64 event count; the equation is the single read "A 34 READ". -->
+    <counter name="Thread Header Ready on Slice0 Subslice0 Port 1"
+             description="The percentage of time in which thread header is ready on slice0 subslice0 thread dispatcher port 1"
+             data_type="float"
+             max_equation="100"
+             equation="C 6 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header00_ready_port1"
+             units="percent"
+             symbol_name="ThreadHeader00ReadyPort1"
+             availability="$SubsliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             /> <!-- ThreadHeader00ReadyPort1: same shape as the port 0 counter but reads C 6; read as RPN (presumably) (C6 * 100) / $GpuCoreClocks, with the same $SubsliceMask 0x1 availability expression. -->
+    <register_config type="NOA"> <!-- NOA register list: one write to 0x91BC, one to 0x9840, then 41 writes that all target 0x9888 with different values. Presumably the write order is significant, so keep the entries in this order (TODO confirm). -->
+        <register type="NOA" address="0x000091BC" value="0xE0500000" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x12124D60" />
+        <register type="NOA" address="0x00009888" value="0x12322E60" />
+        <register type="NOA" address="0x00009888" value="0x12524D60" />
+        <register type="NOA" address="0x00009888" value="0x022F3000" />
+        <register type="NOA" address="0x00009888" value="0x0A4C0014" />
+        <register type="NOA" address="0x00009888" value="0x000D8000" />
+        <register type="NOA" address="0x00009888" value="0x020DA000" />
+        <register type="NOA" address="0x00009888" value="0x040DA000" />
+        <register type="NOA" address="0x00009888" value="0x060D2000" />
+        <register type="NOA" address="0x00009888" value="0x0C0FE000" />
+        <register type="NOA" address="0x00009888" value="0x0E0F0097" />
+        <register type="NOA" address="0x00009888" value="0x082C8000" />
+        <register type="NOA" address="0x00009888" value="0x0A2C8000" />
+        <register type="NOA" address="0x00009888" value="0x002D8000" />
+        <register type="NOA" address="0x00009888" value="0x062D4000" />
+        <register type="NOA" address="0x00009888" value="0x0410C000" />
+        <register type="NOA" address="0x00009888" value="0x0411C000" />
+        <register type="NOA" address="0x00009888" value="0x04121FB7" />
+        <register type="NOA" address="0x00009888" value="0x00120000" />
+        <register type="NOA" address="0x00009888" value="0x04135000" />
+        <register type="NOA" address="0x00009888" value="0x00308000" />
+        <register type="NOA" address="0x00009888" value="0x06304000" />
+        <register type="NOA" address="0x00009888" value="0x00318000" />
+        <register type="NOA" address="0x00009888" value="0x06314000" />
+        <register type="NOA" address="0x00009888" value="0x00321B80" />
+        <register type="NOA" address="0x00009888" value="0x0632003F" />
+        <register type="NOA" address="0x00009888" value="0x00334000" />
+        <register type="NOA" address="0x00009888" value="0x06331000" />
+        <register type="NOA" address="0x00009888" value="0x0250C000" />
+        <register type="NOA" address="0x00009888" value="0x0251C000" />
+        <register type="NOA" address="0x00009888" value="0x02521FB7" />
+        <register type="NOA" address="0x00009888" value="0x00520000" />
+        <register type="NOA" address="0x00009888" value="0x02535000" />
+        <register type="NOA" address="0x00009888" value="0x1190FC00" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x41900800" />
+        <register type="NOA" address="0x00009888" value="0x43900063" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+        <register type="NOA" address="0x00009888" value="0x45900040" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+    </register_config>
+    <register_config type="OA"> <!-- OA register list: six entries in three address pairs (0x2740/0x2744, 0x2710/0x2714, 0x2720/0x2724); the first of each pair is written as 0 and the second as 0x00800000. -->
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002744" value="0x00800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x00800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+    </register_config>
+    <register_config type="FLEX"> <!-- FLEX register list: seven entries at 0xE458, 0xE558, 0xE658, 0xE758, 0xE45C, 0xE55C and 0xE65C. Presumably these select what the flexible counters of this set observe; verify against the hardware documentation. -->
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E758" value="0x00015014" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+        <register type="FLEX" address="0x0000E65C" value="0x00055054" />
+    </register_config>
+  </set>
+
+  <set name="Compute Metrics Extra Gen9"
+       mdapi_supported_apis="VK OGL4 OCL IO BB"
+       underscore_name="compute_extra"
+       hw_config_guid="aa7a3fb9-22fb-43ff-a32d-0ab6c13bbd16"
+       chipset="KBLGT2"
+       symbol_name="ComputeExtra"
+       > <!-- Metric set ComputeExtra for chipset KBLGT2: five counters (GpuCoreClocks, Fpu1Active, GpuTime, AvgGpuCoreFrequency, Fpu1ActiveAdjusted) followed by the NOA, OA and FLEX register lists. Equations look like postfix (RPN) expressions; the infix readings in the comments below assume that, TODO confirm against the equation code generator. -->
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             /> <!-- GpuCoreClocks: unscaled read "GPU_CLOCK 0 READ"; other equations in this set use it as $GpuCoreClocks. -->
+    <counter name="EU FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="fpu1_active"
+             units="percent"
+             symbol_name="Fpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             /> <!-- Fpu1Active: presumably ((A8 / $EuCoresTotalCount) * 100) / $GpuCoreClocks, with max_equation 100. -->
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             /> <!-- GpuTime: presumably (GPU_TIME * 1000000000) / $GpuTimestampFrequency, reported in ns. -->
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             /> <!-- AvgGpuCoreFrequency: presumably ($GpuCoreClocks * 1000000000) / $GpuTime in hz; built from the GpuCoreClocks and GpuTime counters of this set. -->
+    <counter name="EU FPU1 Pipe Active including Ext Math"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing including Extended Math processing"
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ  C 7 READ C 6 READ FADD C 5 READ FADD 8 FMUL FADD 100 FMUL $EuCoresTotalCount FDIV $GpuCoreClocks FDIV"
+             underscore_name="fpu1_active_adjusted"
+             units="percent"
+             symbol_name="Fpu1ActiveAdjusted"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             /> <!-- Fpu1ActiveAdjusted: presumably ((A8 + ((C7 + C6 + C5) * 8)) * 100) / $EuCoresTotalCount / $GpuCoreClocks; uses the floating point operators (FADD, FMUL, FDIV) throughout. -->
+    <register_config type="NOA"> <!-- NOA register list: one write to 0x9840, then 31 writes that all target 0x9888. Presumably order-sensitive; keep as listed (TODO confirm). -->
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x121203E0" />
+        <register type="NOA" address="0x00009888" value="0x123203E0" />
+        <register type="NOA" address="0x00009888" value="0x125203E0" />
+        <register type="NOA" address="0x00009888" value="0x022F4000" />
+        <register type="NOA" address="0x00009888" value="0x0A4C0040" />
+        <register type="NOA" address="0x00009888" value="0x040DA000" />
+        <register type="NOA" address="0x00009888" value="0x060D2000" />
+        <register type="NOA" address="0x00009888" value="0x0E0F006C" />
+        <register type="NOA" address="0x00009888" value="0x0C2C8000" />
+        <register type="NOA" address="0x00009888" value="0x042D8000" />
+        <register type="NOA" address="0x00009888" value="0x06104000" />
+        <register type="NOA" address="0x00009888" value="0x06114000" />
+        <register type="NOA" address="0x00009888" value="0x06120033" />
+        <register type="NOA" address="0x00009888" value="0x00120000" />
+        <register type="NOA" address="0x00009888" value="0x06131000" />
+        <register type="NOA" address="0x00009888" value="0x04308000" />
+        <register type="NOA" address="0x00009888" value="0x04318000" />
+        <register type="NOA" address="0x00009888" value="0x04321980" />
+        <register type="NOA" address="0x00009888" value="0x00320000" />
+        <register type="NOA" address="0x00009888" value="0x04334000" />
+        <register type="NOA" address="0x00009888" value="0x04504000" />
+        <register type="NOA" address="0x00009888" value="0x04514000" />
+        <register type="NOA" address="0x00009888" value="0x04520033" />
+        <register type="NOA" address="0x00009888" value="0x00520000" />
+        <register type="NOA" address="0x00009888" value="0x04531000" />
+        <register type="NOA" address="0x00009888" value="0x1190E000" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+        <register type="NOA" address="0x00009888" value="0x43900C00" />
+        <register type="NOA" address="0x00009888" value="0x45900002" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+    </register_config>
+    <register_config type="OA"> <!-- OA register list: six entries in three address pairs; the first of each pair is 0 and the second 0x00800000. -->
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002744" value="0x00800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x00800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+    </register_config>
+    <register_config type="FLEX"> <!-- FLEX register list: seven entries at 0xE458, 0xE558, 0xE658, 0xE758, 0xE45C, 0xE55C and 0xE65C. -->
+        <register type="FLEX" address="0x0000E458" value="0x00001000" />
+        <register type="FLEX" address="0x0000E558" value="0x00003002" />
+        <register type="FLEX" address="0x0000E658" value="0x00005004" />
+        <register type="FLEX" address="0x0000E758" value="0x00011010" />
+        <register type="FLEX" address="0x0000E45C" value="0x00050012" />
+        <register type="FLEX" address="0x0000E55C" value="0x00052051" />
+        <register type="FLEX" address="0x0000E65C" value="0x00000008" />
+    </register_config>
+  </set>
+
+  <set name="Media Vme Pipe Gen9"
+       mdapi_supported_apis="MEDIA IO BB"
+       underscore_name="vme_pipe"
+       hw_config_guid="398a4268-ef6f-4ffc-b55f-3c7b5363ce61"
+       chipset="KBLGT2"
+       symbol_name="VMEPipe"
+       > <!-- Metric set VMEPipe for chipset KBLGT2: ten counters (GpuCoreClocks, EuActive, EuFpuBothActive, GpuTime, AvgGpuCoreFrequency, CsThreads, EuThreadOccupancy, EuStall, VMEBusy, GpuBusy) followed by the NOA, OA and FLEX register lists. Equations look like postfix (RPN) expressions; the infix readings below assume that, TODO confirm against the equation code generator. -->
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             /> <!-- GpuCoreClocks: unscaled read "GPU_CLOCK 0 READ"; the percentage counters of this set divide by it as $GpuCoreClocks. -->
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             /> <!-- EuActive: presumably ((A7 / $EuCoresTotalCount) * 100) / $GpuCoreClocks. -->
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             /> <!-- EuFpuBothActive: same shape as EuActive but reads A 9. -->
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             /> <!-- GpuTime: presumably (GPU_TIME * 1000000000) / $GpuTimestampFrequency, reported in ns. -->
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             /> <!-- AvgGpuCoreFrequency: presumably ($GpuCoreClocks * 1000000000) / $GpuTime in hz. -->
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             /> <!-- CsThreads: unscaled uint64 event count; the equation is the single read "A 4 READ". -->
+    <counter name="EU Thread Occupancy"
+             description="The percentage of time in which hardware threads occupied EUs."
+             data_type="float"
+             max_equation="100"
+             equation="8 A 10 READ FMUL $EuThreadsCount FDIV $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_thread_occupancy"
+             units="percent"
+             symbol_name="EuThreadOccupancy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             /> <!-- EuThreadOccupancy: presumably ((((8 * A10) / $EuThreadsCount) / $EuCoresTotalCount) * 100) / $GpuCoreClocks; note the mix of float (FMUL, FDIV) and unsigned (UDIV, UMUL) operators. -->
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             /> <!-- EuStall: same shape as EuActive but reads A 8. -->
+    <counter name="VME Busy"
+             description="The percentage of time in which VME (IME or CRE) was actively processing data."
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ B 3 READ FADD 2 FDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vme_busy"
+             units="percent"
+             symbol_name="VMEBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Overview System Batch Tier2"
+             mdapi_group="VME Pipe"
+             mdapi_hw_unit_type="gpu"
+             /> <!-- VMEBusy: presumably (((B0 + B3) / 2) * 100) / $GpuCoreClocks, i.e. the mean of two B reads expressed as a percentage of core clocks. -->
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             /> <!-- GpuBusy: presumably (A0 * 100) / $GpuCoreClocks. -->
+    <register_config type="NOA"> <!-- NOA register list: one write to 0x9840, then 61 writes that all target 0x9888. Presumably order-sensitive; keep as listed (TODO confirm). -->
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x141A5800" />
+        <register type="NOA" address="0x00009888" value="0x161A00C0" />
+        <register type="NOA" address="0x00009888" value="0x12180240" />
+        <register type="NOA" address="0x00009888" value="0x14180002" />
+        <register type="NOA" address="0x00009888" value="0x143A5800" />
+        <register type="NOA" address="0x00009888" value="0x163A00C0" />
+        <register type="NOA" address="0x00009888" value="0x12380240" />
+        <register type="NOA" address="0x00009888" value="0x14380002" />
+        <register type="NOA" address="0x00009888" value="0x002F1000" />
+        <register type="NOA" address="0x00009888" value="0x022F8000" />
+        <register type="NOA" address="0x00009888" value="0x042F3000" />
+        <register type="NOA" address="0x00009888" value="0x004C4000" />
+        <register type="NOA" address="0x00009888" value="0x0A4C1500" />
+        <register type="NOA" address="0x00009888" value="0x000D2000" />
+        <register type="NOA" address="0x00009888" value="0x060D8000" />
+        <register type="NOA" address="0x00009888" value="0x080DA000" />
+        <register type="NOA" address="0x00009888" value="0x0A0DA000" />
+        <register type="NOA" address="0x00009888" value="0x0C0DA000" />
+        <register type="NOA" address="0x00009888" value="0x0C0F0400" />
+        <register type="NOA" address="0x00009888" value="0x0E0F9500" />
+        <register type="NOA" address="0x00009888" value="0x100F002A" />
+        <register type="NOA" address="0x00009888" value="0x002C8000" />
+        <register type="NOA" address="0x00009888" value="0x0E2C8000" />
+        <register type="NOA" address="0x00009888" value="0x162C0A00" />
+        <register type="NOA" address="0x00009888" value="0x0A2DC000" />
+        <register type="NOA" address="0x00009888" value="0x0C2DC000" />
+        <register type="NOA" address="0x00009888" value="0x04193000" />
+        <register type="NOA" address="0x00009888" value="0x081A28C1" />
+        <register type="NOA" address="0x00009888" value="0x001A0000" />
+        <register type="NOA" address="0x00009888" value="0x00133000" />
+        <register type="NOA" address="0x00009888" value="0x0613C000" />
+        <register type="NOA" address="0x00009888" value="0x0813F000" />
+        <register type="NOA" address="0x00009888" value="0x00172000" />
+        <register type="NOA" address="0x00009888" value="0x06178000" />
+        <register type="NOA" address="0x00009888" value="0x0817A000" />
+        <register type="NOA" address="0x00009888" value="0x00180037" />
+        <register type="NOA" address="0x00009888" value="0x06180940" />
+        <register type="NOA" address="0x00009888" value="0x08180000" />
+        <register type="NOA" address="0x00009888" value="0x02180000" />
+        <register type="NOA" address="0x00009888" value="0x04183000" />
+        <register type="NOA" address="0x00009888" value="0x06393000" />
+        <register type="NOA" address="0x00009888" value="0x0C3A28C1" />
+        <register type="NOA" address="0x00009888" value="0x003A0000" />
+        <register type="NOA" address="0x00009888" value="0x0A33F000" />
+        <register type="NOA" address="0x00009888" value="0x0C33F000" />
+        <register type="NOA" address="0x00009888" value="0x0A37A000" />
+        <register type="NOA" address="0x00009888" value="0x0C37A000" />
+        <register type="NOA" address="0x00009888" value="0x0A380977" />
+        <register type="NOA" address="0x00009888" value="0x08380000" />
+        <register type="NOA" address="0x00009888" value="0x04380000" />
+        <register type="NOA" address="0x00009888" value="0x06383000" />
+        <register type="NOA" address="0x00009888" value="0x119000FF" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x41900040" />
+        <register type="NOA" address="0x00009888" value="0x55900000" />
+        <register type="NOA" address="0x00009888" value="0x45900800" />
+        <register type="NOA" address="0x00009888" value="0x47901000" />
+        <register type="NOA" address="0x00009888" value="0x57900000" />
+        <register type="NOA" address="0x00009888" value="0x49900844" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+    </register_config>
+    <register_config type="OA"> <!-- OA register list: 17 entries, 0x2740, 0x2710 to 0x2724 and the contiguous range 0x2770 to 0x279C. NOTE(review): unlike the OA lists of the neighbouring sets in this file, 0x2744 is not written here; presumably intentional in the generated data, confirm before adding it. -->
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x30800000" />
+        <register type="OA" address="0x00002770" value="0x00100030" />
+        <register type="OA" address="0x00002774" value="0x0000FFF9" />
+        <register type="OA" address="0x00002778" value="0x00000002" />
+        <register type="OA" address="0x0000277C" value="0x0000FFFC" />
+        <register type="OA" address="0x00002780" value="0x00000002" />
+        <register type="OA" address="0x00002784" value="0x0000FFF3" />
+        <register type="OA" address="0x00002788" value="0x00100180" />
+        <register type="OA" address="0x0000278C" value="0x0000FFCF" />
+        <register type="OA" address="0x00002790" value="0x00000002" />
+        <register type="OA" address="0x00002794" value="0x0000FFCF" />
+        <register type="OA" address="0x00002798" value="0x00000002" />
+        <register type="OA" address="0x0000279C" value="0x0000FF3F" />
+    </register_config>
+    <register_config type="FLEX"> <!-- FLEX register list: only two entries here, at 0xE458 and 0xE558. -->
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00008003" />
+    </register_config>
+  </set>
+
+  <set name="Gpu Rings Busyness"
+       mdapi_supported_apis="VK OGL OCL MEDIA IO BB"
+       underscore_name="gpu_busyness"
+       hw_config_guid="6c66fe6e-2988-454a-bfae-7fca3bbcbec2"
+       chipset="KBLGT2"
+       symbol_name="GpuBusyness"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             /> <!-- GpuCoreClocks: unscaled read "GPU_CLOCK 0 READ"; the ring busy counters of this set divide by it as $GpuCoreClocks. -->
+    <counter name="Vebox Ring Busy"
+             description="The percentage of time when vebox command streamer was busy."
+             data_type="float"
+             max_equation="100"
+             equation="C 5 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vebox_busy"
+             units="percent"
+             symbol_name="VeboxBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="System Frame Batch"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             /> <!-- VeboxBusy: read as RPN (presumably) (C5 * 100) / $GpuCoreClocks, with max_equation 100. TODO confirm the postfix reading against the equation code generator. -->
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             /> <!-- GpuTime: read as RPN (presumably) (GPU_TIME * 1000000000) / $GpuTimestampFrequency, reported in ns. -->
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Render Ring Busy"
+             description="The percentage of time when render command streamer was busy."
+             data_type="float"
+             max_equation="100"
+             equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="render_busy"
+             units="percent"
+             symbol_name="RenderBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="System Frame Batch"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Vdbox0 Ring Busy"
+             description="The percentage of time when Vdbox0 command streamer was busy."
+             data_type="float"
+             max_equation="100"
+             equation="C 6 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vdbox0_busy"
+             units="percent"
+             symbol_name="Vdbox0Busy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="System Frame Batch"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Blitter Ring Busy"
+             description="The percentage of time when blitter command streamer was busy."
+             data_type="float"
+             max_equation="100"
+             equation="C 4 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="blitter_busy"
+             units="percent"
+             symbol_name="BlitterBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="System Frame Batch"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="AnyRingBusy"
+             description="The percentage of time when any command streamer was busy."
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="any_ring_busy"
+             units="percent"
+             symbol_name="AnyRingBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x13805800" />
+        <register type="NOA" address="0x00009888" value="0x05962C00" />
+        <register type="NOA" address="0x00009888" value="0x19950016" />
+        <register type="NOA" address="0x00009888" value="0x19C05800" />
+        <register type="NOA" address="0x00009888" value="0x07800035" />
+        <register type="NOA" address="0x00009888" value="0x11800000" />
+        <register type="NOA" address="0x00009888" value="0x1D810400" />
+        <register type="NOA" address="0x00009888" value="0x07960025" />
+        <register type="NOA" address="0x00009888" value="0x21960000" />
+        <register type="NOA" address="0x00009888" value="0x0B964000" />
+        <register type="NOA" address="0x00009888" value="0x1B930062" />
+        <register type="NOA" address="0x00009888" value="0x17948000" />
+        <register type="NOA" address="0x00009888" value="0x1B940008" />
+        <register type="NOA" address="0x00009888" value="0x05950075" />
+        <register type="NOA" address="0x00009888" value="0x1D950000" />
+        <register type="NOA" address="0x00009888" value="0x07E54000" />
+        <register type="NOA" address="0x00009888" value="0x09924000" />
+        <register type="NOA" address="0x00009888" value="0x05982000" />
+        <register type="NOA" address="0x00009888" value="0x19908000" />
+        <register type="NOA" address="0x00009888" value="0x1B904000" />
+        <register type="NOA" address="0x00009888" value="0x1D908000" />
+        <register type="NOA" address="0x00009888" value="0x1F908000" />
+        <register type="NOA" address="0x00009888" value="0x09978000" />
+        <register type="NOA" address="0x00009888" value="0x05C08500" />
+        <register type="NOA" address="0x00009888" value="0x25C00000" />
+        <register type="NOA" address="0x00009888" value="0x1BC00000" />
+        <register type="NOA" address="0x00009888" value="0x0BC54000" />
+        <register type="NOA" address="0x00009888" value="0x11900000" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+        <register type="NOA" address="0x00009888" value="0x43900C60" />
+        <register type="NOA" address="0x00009888" value="0x45900040" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x10800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+        <register type="OA" address="0x00002770" value="0x00078000" />
+        <register type="OA" address="0x00002774" value="0x00000FFF" />
+    </register_config>
+  </set>
+
+  <set name="MDAPI testing set Gen9.5"
+       mdapi_supported_apis="VK OGL OCL IO BB"
+       underscore_name="test_oa"
+       hw_config_guid="baa3c7e4-52b6-4b85-801e-465a94b746dd"
+       chipset="KBLGT2"
+       symbol_name="TestOa"
+       >
+    <counter name="TestCounter7"
+             description="HW test counter 7. Factor: 0.666"
+             data_type="uint64"
+             equation="B 7 READ"
+             underscore_name="counter7"
+             units="events"
+             symbol_name="Counter7"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="TestCounter8"
+             description="HW test counter 8. Should be equal to 1."
+             data_type="uint64"
+             equation="C 7 READ"
+             underscore_name="counter8"
+             units="events"
+             symbol_name="Counter8"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="TestCounter4"
+             description="HW test counter 4. Factor: 0.333"
+             data_type="uint64"
+             equation="B 4 READ"
+             underscore_name="counter4"
+             units="events"
+             symbol_name="Counter4"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="TestCounter5"
+             description="HW test counter 5. Factor: 0.333"
+             data_type="uint64"
+             equation="B 5 READ"
+             underscore_name="counter5"
+             units="events"
+             symbol_name="Counter5"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="TestCounter6"
+             description="HW test counter 6. Factor: 0.166"
+             data_type="uint64"
+             equation="B 6 READ"
+             underscore_name="counter6"
+             units="events"
+             symbol_name="Counter6"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="TestCounter3"
+             description="HW test counter 3. Factor: 0.5"
+             data_type="uint64"
+             equation="B 3 READ"
+             underscore_name="counter3"
+             units="events"
+             symbol_name="Counter3"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="TestCounter0"
+             description="HW test counter 0. Factor: 0.0"
+             data_type="uint64"
+             equation="B 0 READ"
+             underscore_name="counter0"
+             units="events"
+             symbol_name="Counter0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="TestCounter1"
+             description="HW test counter 1. Factor: 1.0"
+             data_type="uint64"
+             equation="B 1 READ"
+             underscore_name="counter1"
+             units="events"
+             symbol_name="Counter1"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="TestCounter2"
+             description="HW test counter 2. Factor: 1.0"
+             data_type="uint64"
+             equation="B 2 READ"
+             underscore_name="counter2"
+             units="events"
+             symbol_name="Counter2"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x11810000" />
+        <register type="NOA" address="0x00009888" value="0x07810013" />
+        <register type="NOA" address="0x00009888" value="0x1F810000" />
+        <register type="NOA" address="0x00009888" value="0x1D810000" />
+        <register type="NOA" address="0x00009888" value="0x1B930040" />
+        <register type="NOA" address="0x00009888" value="0x07E54000" />
+        <register type="NOA" address="0x00009888" value="0x1F908000" />
+        <register type="NOA" address="0x00009888" value="0x11900000" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+        <register type="NOA" address="0x00009888" value="0x45900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002744" value="0x00800000" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002770" value="0x00000004" />
+        <register type="OA" address="0x00002774" value="0x00000000" />
+        <register type="OA" address="0x00002778" value="0x00000003" />
+        <register type="OA" address="0x0000277C" value="0x00000000" />
+        <register type="OA" address="0x00002780" value="0x00000007" />
+        <register type="OA" address="0x00002784" value="0x00000000" />
+        <register type="OA" address="0x00002788" value="0x00100002" />
+        <register type="OA" address="0x0000278C" value="0x0000FFF7" />
+        <register type="OA" address="0x00002790" value="0x00100002" />
+        <register type="OA" address="0x00002794" value="0x0000FFCF" />
+        <register type="OA" address="0x00002798" value="0x00100082" />
+        <register type="OA" address="0x0000279C" value="0x0000FFEF" />
+        <register type="OA" address="0x000027A0" value="0x001000C2" />
+        <register type="OA" address="0x000027A4" value="0x0000FFE7" />
+        <register type="OA" address="0x000027A8" value="0x00100001" />
+        <register type="OA" address="0x000027AC" value="0x0000FFE7" />
+    </register_config>
+  </set>
+
+  <set name="Metric set PMA Stall"
+       mdapi_supported_apis="VK OGL OGL4 OCL IO MEDIA"
+       underscore_name="pma__stall"
+       hw_config_guid="b49aa434-4958-4d98-9e6f-443ff27ca74d"
+       chipset="KBLGT2"
+       symbol_name="PMA_Stall"
+       >
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="STC PMA stall"
+             description="Percentage of time when stencil cache line and an overlapping pixel are causing stalls"
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ B 1 READ FADD 2 FDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="stc_pma_stall"
+             units="percent"
+             symbol_name="StcPMAStall"
+             availability="$SliceMask 1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_group="GPU/Stencil Cache"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x122D3080" />
+        <register type="NOA" address="0x00009888" value="0x000D2000" />
+        <register type="NOA" address="0x00009888" value="0x060D8000" />
+        <register type="NOA" address="0x00009888" value="0x080DA000" />
+        <register type="NOA" address="0x00009888" value="0x0A0DA000" />
+        <register type="NOA" address="0x00009888" value="0x0C0F0800" />
+        <register type="NOA" address="0x00009888" value="0x0E0FAA00" />
+        <register type="NOA" address="0x00009888" value="0x100F0002" />
+        <register type="NOA" address="0x00009888" value="0x002D0025" />
+        <register type="NOA" address="0x00009888" value="0x062D1300" />
+        <register type="NOA" address="0x00009888" value="0x082D16A4" />
+        <register type="NOA" address="0x00009888" value="0x0A2D162E" />
+        <register type="NOA" address="0x00009888" value="0x102D0000" />
+        <register type="NOA" address="0x00009888" value="0x1190003F" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x41900000" />
+        <register type="NOA" address="0x00009888" value="0x55900000" />
+        <register type="NOA" address="0x00009888" value="0x45900000" />
+        <register type="NOA" address="0x00009888" value="0x47900000" />
+        <register type="NOA" address="0x00009888" value="0x57900000" />
+        <register type="NOA" address="0x00009888" value="0x49900000" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x30800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+        <register type="OA" address="0x00002770" value="0x00E00021" />
+        <register type="OA" address="0x00002774" value="0x0007FFF8" />
+        <register type="OA" address="0x00002778" value="0x07000101" />
+        <register type="OA" address="0x0000277C" value="0x0038FFC7" />
+    </register_config>
+  </set>
+
+</metrics>
diff --git a/lib/i915/perf-configs/oa-kblgt3.xml b/lib/i915/perf-configs/oa-kblgt3.xml
new file mode 100644
index 00000000..771c0c44
--- /dev/null
+++ b/lib/i915/perf-configs/oa-kblgt3.xml
@@ -0,0 +1,10933 @@
+<?xml version="1.0"?>
+<metrics version="1581935519" merge_md5="">
+  <set name="Render Metrics Basic Gen9"
+       mdapi_supported_apis="VK OGL OCL IO BB"
+       underscore_name="render_basic"
+       hw_config_guid="17b4f3e0-d578-4ae3-b7a8-98d756d1e0df"
+       chipset="KBLGT3"
+       symbol_name="RenderBasic"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Misses"
+             description="The total number of L3 misses."
+             data_type="uint64"
+             equation="C 4 READ"
+             underscore_name="l3_misses"
+             units="messages"
+             symbol_name="L3Misses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/TAG"
+             />
+    <counter name="GTI L3 Throughput"
+             description="The total number of GPU memory bytes transferred between L3 caches and GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="$L3Misses 64 UMUL"
+             underscore_name="gti_l3_throughput"
+             units="bytes"
+             symbol_name="GtiL3Throughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Cache Misses"
+             description="The total number of sampler cache misses in all LODs in all sampler units."
+             data_type="uint64"
+             equation="B 4 READ B 5 READ UADD 8 UMUL"
+             underscore_name="sampler_l1_misses"
+             units="messages"
+             symbol_name="SamplerL1Misses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler 1 Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which Sampler 1 has been slowing down the pipe when processing EU requests."
+             data_type="float"
+             high_watermark="15"
+             equation="B 3 READ 100 UMUL $GpuCoreClocks FDIV"
+             max_equation="100"
+             underscore_name="sampler1_bottleneck"
+             units="percent"
+             symbol_name="Sampler1Bottleneck"
+             availability="$SubsliceMask 0x12 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="L3 Sampler Throughput"
+             description="The total number of GPU memory bytes transferred between samplers and L3 caches."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="$SamplerL1Misses 64 UMUL"
+             underscore_name="l3_sampler_throughput"
+             units="bytes"
+             symbol_name="L3SamplerThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Sampler"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on the both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Sampler 0 Busy"
+             description="The percentage of time in which Sampler 0 has been processing EU requests."
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler0_busy"
+             units="percent"
+             symbol_name="Sampler0Busy"
+             availability="$SubsliceMask 0x09 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_group="Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Sampler 1 Busy"
+             description="The percentage of time in which Sampler 1 has been processing EU requests."
+             data_type="float"
+             max_equation="100"
+             equation="B 1 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler1_busy"
+             units="percent"
+             symbol_name="Sampler1Busy"
+             availability="$SubsliceMask 0x12 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_group="Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Samplers Busy"
+             description="The percentage of time in which samplers have been processing EU requests."
+             data_type="float"
+             max_equation="100"
+             equation="$Sampler0Busy $Sampler1Busy FMAX"
+             underscore_name="samplers_busy"
+             units="percent"
+             symbol_name="SamplersBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="Sampler"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="GTI Fixed Pipe Throughput"
+             description="The total number of GPU memory bytes transferred between 3D Pipeline (Command Dispatch, Input Assembly and Stream Output) and GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL"
+             equation="B 6 READ B 7 READ UADD 64 UMUL"
+             underscore_name="gti_vf_throughput"
+             units="bytes"
+             symbol_name="GtiVfThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="GTI/3D Pipe"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler 0 Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which Sampler 0 has been slowing down the pipe when processing EU requests."
+             data_type="float"
+             high_watermark="15"
+             equation="B 2 READ 100 UMUL $GpuCoreClocks FDIV"
+             max_equation="100"
+             underscore_name="sampler0_bottleneck"
+             units="percent"
+             symbol_name="Sampler0Bottleneck"
+             availability="$SubsliceMask 0x09 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texel lookups (with 2x2 accuracy) that missed the L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="L3 Lookup Accesses w/o IC"
+             description="The total number of L3 cache lookup accesses w/o IC."
+             data_type="uint64"
+             equation="$SamplerL1Misses $ShaderMemoryAccesses UADD"
+             underscore_name="l3_lookups"
+             units="messages"
+             symbol_name="L3Lookups"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/TAG"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GTI Read Throughput"
+             description="The total number of GPU memory bytes read from GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL"
+             equation="C 6 READ 64 UMUL"
+             underscore_name="gti_read_throughput"
+             units="bytes"
+             symbol_name="GtiReadThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GTI Depth Throughput"
+             description="The total number of GPU memory bytes transferred between depth caches and GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="C 0 READ C 1 READ UADD 64 UMUL"
+             underscore_name="gti_depth_throughput"
+             units="bytes"
+             symbol_name="GtiDepthThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="GTI/Depth Cache"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Samplers Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which samplers have been slowing down the pipe when processing EU requests."
+             data_type="float"
+             high_watermark="15"
+             equation="$Sampler0Bottleneck $Sampler1Bottleneck FMAX"
+             max_equation="100"
+             underscore_name="sampler_bottleneck"
+             units="percent"
+             symbol_name="SamplerBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Indicate System Frame Batch Draw"
+             mdapi_group="Sampler"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="GTI HDC TLB Lookup Throughput"
+             description="The total number of GPU memory bytes transferred between GTI and HDC, when HDC is doing TLB lookups."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="C 5 READ 64 UMUL"
+             underscore_name="gti_hdc_lookups_throughput"
+             units="bytes"
+             symbol_name="GtiHdcLookupsThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GTI RCC Throughput"
+             description="The total number of GPU memory bytes transferred between render color caches and GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="C 2 READ C 3 READ UADD 64 UMUL"
+             underscore_name="gti_rcc_throughput"
+             units="bytes"
+             symbol_name="GtiRccThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="GTI/Color Cache"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="GTI Write Throughput"
+             description="The total number of GPU memory bytes written to GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 32 UMUL"
+             equation="C 7 READ 64 UMUL"
+             underscore_name="gti_write_throughput"
+             units="bytes"
+             symbol_name="GtiWriteThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x166C01E0" />
+        <register type="NOA" address="0x00009888" value="0x12170280" />
+        <register type="NOA" address="0x00009888" value="0x12370280" />
+        <register type="NOA" address="0x00009888" value="0x16EC01E0" />
+        <register type="NOA" address="0x00009888" value="0x11930317" />
+        <register type="NOA" address="0x00009888" value="0x159303DF" />
+        <register type="NOA" address="0x00009888" value="0x3F900003" />
+        <register type="NOA" address="0x00009888" value="0x1A4E0380" />
+        <register type="NOA" address="0x00009888" value="0x0A6C0053" />
+        <register type="NOA" address="0x00009888" value="0x106C0000" />
+        <register type="NOA" address="0x00009888" value="0x1C6C0000" />
+        <register type="NOA" address="0x00009888" value="0x0A1B4000" />
+        <register type="NOA" address="0x00009888" value="0x1C1C0001" />
+        <register type="NOA" address="0x00009888" value="0x002F1000" />
+        <register type="NOA" address="0x00009888" value="0x042F1000" />
+        <register type="NOA" address="0x00009888" value="0x004C4000" />
+        <register type="NOA" address="0x00009888" value="0x0A4C8400" />
+        <register type="NOA" address="0x00009888" value="0x0C4C0002" />
+        <register type="NOA" address="0x00009888" value="0x000D2000" />
+        <register type="NOA" address="0x00009888" value="0x060D8000" />
+        <register type="NOA" address="0x00009888" value="0x080DA000" />
+        <register type="NOA" address="0x00009888" value="0x0A0DA000" />
+        <register type="NOA" address="0x00009888" value="0x0C0F0400" />
+        <register type="NOA" address="0x00009888" value="0x0E0F6600" />
+        <register type="NOA" address="0x00009888" value="0x100F0001" />
+        <register type="NOA" address="0x00009888" value="0x002C8000" />
+        <register type="NOA" address="0x00009888" value="0x162CA200" />
+        <register type="NOA" address="0x00009888" value="0x062D8000" />
+        <register type="NOA" address="0x00009888" value="0x082D8000" />
+        <register type="NOA" address="0x00009888" value="0x00133000" />
+        <register type="NOA" address="0x00009888" value="0x08133000" />
+        <register type="NOA" address="0x00009888" value="0x00170020" />
+        <register type="NOA" address="0x00009888" value="0x08170021" />
+        <register type="NOA" address="0x00009888" value="0x10170000" />
+        <register type="NOA" address="0x00009888" value="0x0633C000" />
+        <register type="NOA" address="0x00009888" value="0x0833C000" />
+        <register type="NOA" address="0x00009888" value="0x06370800" />
+        <register type="NOA" address="0x00009888" value="0x08370840" />
+        <register type="NOA" address="0x00009888" value="0x10370000" />
+        <register type="NOA" address="0x00009888" value="0x1ACE0200" />
+        <register type="NOA" address="0x00009888" value="0x0AEC5300" />
+        <register type="NOA" address="0x00009888" value="0x10EC0000" />
+        <register type="NOA" address="0x00009888" value="0x1CEC0000" />
+        <register type="NOA" address="0x00009888" value="0x0A9B8000" />
+        <register type="NOA" address="0x00009888" value="0x1C9C0002" />
+        <register type="NOA" address="0x00009888" value="0x0CCC0002" />
+        <register type="NOA" address="0x00009888" value="0x0A8D8000" />
+        <register type="NOA" address="0x00009888" value="0x108F0001" />
+        <register type="NOA" address="0x00009888" value="0x16AC8000" />
+        <register type="NOA" address="0x00009888" value="0x0D933031" />
+        <register type="NOA" address="0x00009888" value="0x0F933E3F" />
+        <register type="NOA" address="0x00009888" value="0x01933D00" />
+        <register type="NOA" address="0x00009888" value="0x0393073C" />
+        <register type="NOA" address="0x00009888" value="0x0593000E" />
+        <register type="NOA" address="0x00009888" value="0x1D930000" />
+        <register type="NOA" address="0x00009888" value="0x19930000" />
+        <register type="NOA" address="0x00009888" value="0x1B930000" />
+        <register type="NOA" address="0x00009888" value="0x1D900157" />
+        <register type="NOA" address="0x00009888" value="0x1F900158" />
+        <register type="NOA" address="0x00009888" value="0x35900000" />
+        <register type="NOA" address="0x00009888" value="0x2B908000" />
+        <register type="NOA" address="0x00009888" value="0x2D908000" />
+        <register type="NOA" address="0x00009888" value="0x2F908000" />
+        <register type="NOA" address="0x00009888" value="0x31908000" />
+        <register type="NOA" address="0x00009888" value="0x15908000" />
+        <register type="NOA" address="0x00009888" value="0x17908000" />
+        <register type="NOA" address="0x00009888" value="0x19908000" />
+        <register type="NOA" address="0x00009888" value="0x1B908000" />
+        <register type="NOA" address="0x00009888" value="0x1190003F" />
+        <register type="NOA" address="0x00009888" value="0x51902240" />
+        <register type="NOA" address="0x00009888" value="0x41900C00" />
+        <register type="NOA" address="0x00009888" value="0x55900242" />
+        <register type="NOA" address="0x00009888" value="0x45900084" />
+        <register type="NOA" address="0x00009888" value="0x47901400" />
+        <register type="NOA" address="0x00009888" value="0x57902220" />
+        <register type="NOA" address="0x00009888" value="0x49900C60" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+        <register type="NOA" address="0x00009888" value="0x4B900063" />
+        <register type="NOA" address="0x00009888" value="0x59900002" />
+        <register type="NOA" address="0x00009888" value="0x43900C63" />
+        <register type="NOA" address="0x00009888" value="0x53902222" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x00800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+        <register type="OA" address="0x00002740" value="0x00000000" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E758" value="0x00015014" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+        <register type="FLEX" address="0x0000E65C" value="0x00222222" />
+    </register_config>
+  </set>
+
+  <set name="Compute Metrics Basic Gen9"
+       mdapi_supported_apis="VK OGL4 OCL IO BB"
+       underscore_name="compute_basic"
+       hw_config_guid="a5dc0bc5-d6fa-4f3a-9979-d3248c786042"
+       chipset="KBLGT3"
+       symbol_name="ComputeBasic"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Untyped Bytes Read"
+             description="The total number of untyped memory bytes read via Data Port."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="B 6 READ B 7 READ C 0 READ UADD UADD $EuSlicesTotalCount 64 UMUL UMUL"
+             underscore_name="untyped_bytes_read"
+             units="bytes"
+             symbol_name="UntypedBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Typed Bytes Written"
+             description="The total number of typed memory bytes written via Data Port."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="B 3 READ B 4 READ B 5 READ UADD UADD $EuSlicesTotalCount 64 UMUL UMUL"
+             underscore_name="typed_bytes_written"
+             units="bytes"
+             symbol_name="TypedBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="fpu0_active"
+             units="percent"
+             symbol_name="Fpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="fpu1_active"
+             units="percent"
+             symbol_name="Fpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO OCL BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU AVG IPC Rate"
+             description="The average rate of IPC calculated for 2 FPU pipelines."
+             data_type="float"
+             max_equation="2"
+             equation="A 9 READ  A 10 READ  A 11 READ UADD  A 9 READ USUB FDIV 1 FADD"
+             underscore_name="eu_avg_ipc_rate"
+             units="number"
+             symbol_name="EuAvgIpcRate"
+             semantic_type="ratio"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier4 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO OCL BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO OCL BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texel lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GTI Read Throughput"
+             description="The total number of GPU memory bytes read from GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="C 4 READ 64 UMUL"
+             underscore_name="gti_read_throughput"
+             units="bytes"
+             symbol_name="GtiReadThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Untyped Writes"
+             description="The total number of untyped memory bytes written via Data Port."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="C 1 READ C 2 READ C 3 READ UADD UADD $EuSlicesTotalCount 64 UMUL UMUL"
+             underscore_name="untyped_bytes_written"
+             units="bytes"
+             symbol_name="UntypedBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO OCL BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="Typed Bytes Read"
+             description="The total number of typed memory bytes read via Data Port."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="B 0 READ B 1 READ B 2 READ UADD UADD $EuSlicesTotalCount 64 UMUL UMUL"
+             underscore_name="typed_bytes_read"
+             units="bytes"
+             symbol_name="TypedBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="EU Thread Occupancy"
+             description="The percentage of time in which hardware threads occupied EUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 13 READ 8 UMUL $EuCoresTotalCount UDIV $EuThreadsCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_thread_occupancy"
+             units="percent"
+             symbol_name="EuThreadOccupancy"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO OCL BB"
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO OCL BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO OCL BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="GTI Write Throughput"
+             description="The total number of GPU memory bytes written to GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 32 UMUL"
+             equation="C 5 READ 64 UMUL"
+             underscore_name="gti_write_throughput"
+             units="bytes"
+             symbol_name="GtiWriteThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO OCL BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO OCL BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <counter name="EU Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_send_active"
+             units="percent"
+             symbol_name="EuSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO OCL BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x104F00E0" />
+        <register type="NOA" address="0x00009888" value="0x124F1C00" />
+        <register type="NOA" address="0x00009888" value="0x106C00E0" />
+        <register type="NOA" address="0x00009888" value="0x37906800" />
+        <register type="NOA" address="0x00009888" value="0x3F900003" />
+        <register type="NOA" address="0x00009888" value="0x004E8000" />
+        <register type="NOA" address="0x00009888" value="0x1A4E0820" />
+        <register type="NOA" address="0x00009888" value="0x1C4E0002" />
+        <register type="NOA" address="0x00009888" value="0x064F0900" />
+        <register type="NOA" address="0x00009888" value="0x084F0032" />
+        <register type="NOA" address="0x00009888" value="0x0A4F1891" />
+        <register type="NOA" address="0x00009888" value="0x0C4F0E00" />
+        <register type="NOA" address="0x00009888" value="0x0E4F003C" />
+        <register type="NOA" address="0x00009888" value="0x004F0D80" />
+        <register type="NOA" address="0x00009888" value="0x024F003B" />
+        <register type="NOA" address="0x00009888" value="0x006C0002" />
+        <register type="NOA" address="0x00009888" value="0x086C0100" />
+        <register type="NOA" address="0x00009888" value="0x0C6C000C" />
+        <register type="NOA" address="0x00009888" value="0x0E6C0B00" />
+        <register type="NOA" address="0x00009888" value="0x186C0000" />
+        <register type="NOA" address="0x00009888" value="0x1C6C0000" />
+        <register type="NOA" address="0x00009888" value="0x1E6C0000" />
+        <register type="NOA" address="0x00009888" value="0x001B4000" />
+        <register type="NOA" address="0x00009888" value="0x081B8000" />
+        <register type="NOA" address="0x00009888" value="0x0C1B4000" />
+        <register type="NOA" address="0x00009888" value="0x0E1B8000" />
+        <register type="NOA" address="0x00009888" value="0x101C8000" />
+        <register type="NOA" address="0x00009888" value="0x1A1C8000" />
+        <register type="NOA" address="0x00009888" value="0x1C1C0024" />
+        <register type="NOA" address="0x00009888" value="0x065B8000" />
+        <register type="NOA" address="0x00009888" value="0x085B4000" />
+        <register type="NOA" address="0x00009888" value="0x0A5BC000" />
+        <register type="NOA" address="0x00009888" value="0x0C5B8000" />
+        <register type="NOA" address="0x00009888" value="0x0E5B4000" />
+        <register type="NOA" address="0x00009888" value="0x005B8000" />
+        <register type="NOA" address="0x00009888" value="0x025B4000" />
+        <register type="NOA" address="0x00009888" value="0x1A5C6000" />
+        <register type="NOA" address="0x00009888" value="0x1C5C001B" />
+        <register type="NOA" address="0x00009888" value="0x125C8000" />
+        <register type="NOA" address="0x00009888" value="0x145C8000" />
+        <register type="NOA" address="0x00009888" value="0x004C8000" />
+        <register type="NOA" address="0x00009888" value="0x0A4C2000" />
+        <register type="NOA" address="0x00009888" value="0x0C4C0208" />
+        <register type="NOA" address="0x00009888" value="0x000DA000" />
+        <register type="NOA" address="0x00009888" value="0x060D8000" />
+        <register type="NOA" address="0x00009888" value="0x080DA000" />
+        <register type="NOA" address="0x00009888" value="0x0A0DA000" />
+        <register type="NOA" address="0x00009888" value="0x0C0DA000" />
+        <register type="NOA" address="0x00009888" value="0x0E0DA000" />
+        <register type="NOA" address="0x00009888" value="0x020D2000" />
+        <register type="NOA" address="0x00009888" value="0x0C0F5400" />
+        <register type="NOA" address="0x00009888" value="0x0E0F5500" />
+        <register type="NOA" address="0x00009888" value="0x100F0155" />
+        <register type="NOA" address="0x00009888" value="0x002C8000" />
+        <register type="NOA" address="0x00009888" value="0x0E2CC000" />
+        <register type="NOA" address="0x00009888" value="0x162CFB00" />
+        <register type="NOA" address="0x00009888" value="0x182C00BE" />
+        <register type="NOA" address="0x00009888" value="0x022CC000" />
+        <register type="NOA" address="0x00009888" value="0x042CC000" />
+        <register type="NOA" address="0x00009888" value="0x19900157" />
+        <register type="NOA" address="0x00009888" value="0x1B900158" />
+        <register type="NOA" address="0x00009888" value="0x1D900105" />
+        <register type="NOA" address="0x00009888" value="0x1F900103" />
+        <register type="NOA" address="0x00009888" value="0x35900000" />
+        <register type="NOA" address="0x00009888" value="0x11900FFF" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x41900800" />
+        <register type="NOA" address="0x00009888" value="0x55900000" />
+        <register type="NOA" address="0x00009888" value="0x45900821" />
+        <register type="NOA" address="0x00009888" value="0x47900802" />
+        <register type="NOA" address="0x00009888" value="0x57900000" />
+        <register type="NOA" address="0x00009888" value="0x49900802" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+        <register type="NOA" address="0x00009888" value="0x4B900002" />
+        <register type="NOA" address="0x00009888" value="0x59900000" />
+        <register type="NOA" address="0x00009888" value="0x43900422" />
+        <register type="NOA" address="0x00009888" value="0x53904444" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x00800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+        <register type="OA" address="0x00002740" value="0x00000000" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00000003" />
+        <register type="FLEX" address="0x0000E658" value="0x00002001" />
+        <register type="FLEX" address="0x0000E758" value="0x00778008" />
+        <register type="FLEX" address="0x0000E45C" value="0x00088078" />
+        <register type="FLEX" address="0x0000E55C" value="0x00808708" />
+        <register type="FLEX" address="0x0000E65C" value="0x00222222" />
+    </register_config>
+  </set>
+
+  <set name="Render Metrics for 3D Pipeline Profile Gen9"
+       mdapi_supported_apis="VK OGL OCL IO BB"
+       underscore_name="render_pipe_profile"
+       hw_config_guid="c7c735f3-ce58-45cf-aa04-30b183f1faff"
+       chipset="KBLGT3"
+       symbol_name="RenderPipeProfile"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Bottleneck"
+             low_watermark="10"
+             description="The percentage of time in which vertex shader pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="30"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_bottleneck"
+             units="percent"
+             symbol_name="VsBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Hi-Depth Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which early hierarchical depth test pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="15"
+             equation="C 6 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="hi_depth_bottleneck"
+             units="percent"
+             symbol_name="HiDepthBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which geometry shader pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="15"
+             equation="B 3 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gs_bottleneck"
+             units="percent"
+             symbol_name="GsBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Geometry Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="BC Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which barycentric coordinates calculation pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="15"
+             equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="bc_bottleneck"
+             units="percent"
+             symbol_name="BcBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Rasterizer/Barycentric Calc"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="HS Stall"
+             description="The percentage of time in which hull shader pipeline stage was stalled."
+             data_type="float"
+             equation="C 1 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="hs_stall"
+             units="percent"
+             symbol_name="HsStall"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier4 Correlate Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Hull Shader"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texel lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="VF Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which vertex fetch pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="15"
+             equation="C 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vf_bottleneck"
+             units="percent"
+             symbol_name="VfBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Input Assembler"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Strip-Fans Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which strip-fans pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="10"
+             equation="B 6 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sf_bottleneck"
+             units="percent"
+             symbol_name="SfBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Rasterizer/Strip-Fans"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SF Stall"
+             description="The percentage of time in which strip-fans pipeline stage was stalled."
+             data_type="float"
+             equation="C 5 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sf_stall"
+             units="percent"
+             symbol_name="SfStall"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Correlate Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Strip-Fans"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="HS Bottleneck"
+             low_watermark="3"
+             description="The percentage of time in which hull shader pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="9"
+             equation="B 1 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="hs_bottleneck"
+             units="percent"
+             symbol_name="HsBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Hull Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="CL Stall"
+             description="The percentage of time in which clipper pipeline stage was stalled."
+             data_type="float"
+             equation="C 4 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="cl_stall"
+             units="percent"
+             symbol_name="ClStall"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Correlate Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Clipper"
+             />
+    <counter name="SO Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which stream output pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="15"
+             equation="B 4 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="so_bottleneck"
+             units="percent"
+             symbol_name="SoBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Stream Output"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="DS Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which domain shader pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="15"
+             equation="B 2 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ds_bottleneck"
+             units="percent"
+             symbol_name="DsBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Domain Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Clipper Bottleneck"
+             low_watermark="10"
+             description="The percentage of time in which clipper pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="30"
+             equation="B 5 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="cl_bottleneck"
+             units="percent"
+             symbol_name="ClBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Clipper"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Stall"
+             description="The percentage of time in which domain shader pipeline stage was stalled."
+             data_type="float"
+             equation="C 2 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ds_stall"
+             units="percent"
+             symbol_name="DsStall"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier4 Correlate Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Domain Shader"
+             />
+    <counter name="Early Depth Bottleneck"
+             low_watermark="10"
+             description="The percentage of time in which early depth test pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="30"
+             equation="B 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="early_depth_bottleneck"
+             units="percent"
+             symbol_name="EarlyDepthBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="SO Stall"
+             description="The percentage of time in which stream-output pipeline stage was stalled."
+             data_type="float"
+             equation="C 3 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="so_stall"
+             units="percent"
+             symbol_name="SoStall"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Correlate Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Stream Output"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x0C0E001F" />
+        <register type="NOA" address="0x00009888" value="0x0A0F0000" />
+        <register type="NOA" address="0x00009888" value="0x10116800" />
+        <register type="NOA" address="0x00009888" value="0x178A03E0" />
+        <register type="NOA" address="0x00009888" value="0x11824C00" />
+        <register type="NOA" address="0x00009888" value="0x11830020" />
+        <register type="NOA" address="0x00009888" value="0x13840020" />
+        <register type="NOA" address="0x00009888" value="0x11850019" />
+        <register type="NOA" address="0x00009888" value="0x11860007" />
+        <register type="NOA" address="0x00009888" value="0x01870C40" />
+        <register type="NOA" address="0x00009888" value="0x17880000" />
+        <register type="NOA" address="0x00009888" value="0x022F4000" />
+        <register type="NOA" address="0x00009888" value="0x0A4C0040" />
+        <register type="NOA" address="0x00009888" value="0x0C0D8000" />
+        <register type="NOA" address="0x00009888" value="0x040D4000" />
+        <register type="NOA" address="0x00009888" value="0x060D2000" />
+        <register type="NOA" address="0x00009888" value="0x020E5400" />
+        <register type="NOA" address="0x00009888" value="0x000E0000" />
+        <register type="NOA" address="0x00009888" value="0x080F0040" />
+        <register type="NOA" address="0x00009888" value="0x000F0000" />
+        <register type="NOA" address="0x00009888" value="0x100F0000" />
+        <register type="NOA" address="0x00009888" value="0x0E0F0040" />
+        <register type="NOA" address="0x00009888" value="0x0C2C8000" />
+        <register type="NOA" address="0x00009888" value="0x06104000" />
+        <register type="NOA" address="0x00009888" value="0x06110012" />
+        <register type="NOA" address="0x00009888" value="0x06131000" />
+        <register type="NOA" address="0x00009888" value="0x01898000" />
+        <register type="NOA" address="0x00009888" value="0x0D890100" />
+        <register type="NOA" address="0x00009888" value="0x03898000" />
+        <register type="NOA" address="0x00009888" value="0x09808000" />
+        <register type="NOA" address="0x00009888" value="0x0B808000" />
+        <register type="NOA" address="0x00009888" value="0x0380C000" />
+        <register type="NOA" address="0x00009888" value="0x0F8A0075" />
+        <register type="NOA" address="0x00009888" value="0x1D8A0000" />
+        <register type="NOA" address="0x00009888" value="0x118A8000" />
+        <register type="NOA" address="0x00009888" value="0x1B8A4000" />
+        <register type="NOA" address="0x00009888" value="0x138A8000" />
+        <register type="NOA" address="0x00009888" value="0x1D81A000" />
+        <register type="NOA" address="0x00009888" value="0x15818000" />
+        <register type="NOA" address="0x00009888" value="0x17818000" />
+        <register type="NOA" address="0x00009888" value="0x0B820030" />
+        <register type="NOA" address="0x00009888" value="0x07828000" />
+        <register type="NOA" address="0x00009888" value="0x0D824000" />
+        <register type="NOA" address="0x00009888" value="0x0F828000" />
+        <register type="NOA" address="0x00009888" value="0x05824000" />
+        <register type="NOA" address="0x00009888" value="0x0D830003" />
+        <register type="NOA" address="0x00009888" value="0x0583000C" />
+        <register type="NOA" address="0x00009888" value="0x09830000" />
+        <register type="NOA" address="0x00009888" value="0x03838000" />
+        <register type="NOA" address="0x00009888" value="0x07838000" />
+        <register type="NOA" address="0x00009888" value="0x0B840980" />
+        <register type="NOA" address="0x00009888" value="0x03844D80" />
+        <register type="NOA" address="0x00009888" value="0x11840000" />
+        <register type="NOA" address="0x00009888" value="0x09848000" />
+        <register type="NOA" address="0x00009888" value="0x09850080" />
+        <register type="NOA" address="0x00009888" value="0x03850003" />
+        <register type="NOA" address="0x00009888" value="0x01850000" />
+        <register type="NOA" address="0x00009888" value="0x07860000" />
+        <register type="NOA" address="0x00009888" value="0x0F860400" />
+        <register type="NOA" address="0x00009888" value="0x09870032" />
+        <register type="NOA" address="0x00009888" value="0x01888052" />
+        <register type="NOA" address="0x00009888" value="0x11880000" />
+        <register type="NOA" address="0x00009888" value="0x09884000" />
+        <register type="NOA" address="0x00009888" value="0x1B931001" />
+        <register type="NOA" address="0x00009888" value="0x1D930001" />
+        <register type="NOA" address="0x00009888" value="0x19934000" />
+        <register type="NOA" address="0x00009888" value="0x1B958000" />
+        <register type="NOA" address="0x00009888" value="0x1D950094" />
+        <register type="NOA" address="0x00009888" value="0x19958000" />
+        <register type="NOA" address="0x00009888" value="0x09E58000" />
+        <register type="NOA" address="0x00009888" value="0x0BE58000" />
+        <register type="NOA" address="0x00009888" value="0x03E5C000" />
+        <register type="NOA" address="0x00009888" value="0x0592C000" />
+        <register type="NOA" address="0x00009888" value="0x0B928000" />
+        <register type="NOA" address="0x00009888" value="0x0D924000" />
+        <register type="NOA" address="0x00009888" value="0x0F924000" />
+        <register type="NOA" address="0x00009888" value="0x11928000" />
+        <register type="NOA" address="0x00009888" value="0x1392C000" />
+        <register type="NOA" address="0x00009888" value="0x09924000" />
+        <register type="NOA" address="0x00009888" value="0x01985000" />
+        <register type="NOA" address="0x00009888" value="0x07988000" />
+        <register type="NOA" address="0x00009888" value="0x09981000" />
+        <register type="NOA" address="0x00009888" value="0x0B982000" />
+        <register type="NOA" address="0x00009888" value="0x0D982000" />
+        <register type="NOA" address="0x00009888" value="0x0F989000" />
+        <register type="NOA" address="0x00009888" value="0x05982000" />
+        <register type="NOA" address="0x00009888" value="0x13904000" />
+        <register type="NOA" address="0x00009888" value="0x21904000" />
+        <register type="NOA" address="0x00009888" value="0x23904000" />
+        <register type="NOA" address="0x00009888" value="0x25908000" />
+        <register type="NOA" address="0x00009888" value="0x27904000" />
+        <register type="NOA" address="0x00009888" value="0x29908000" />
+        <register type="NOA" address="0x00009888" value="0x2B904000" />
+        <register type="NOA" address="0x00009888" value="0x2F904000" />
+        <register type="NOA" address="0x00009888" value="0x31904000" />
+        <register type="NOA" address="0x00009888" value="0x15904000" />
+        <register type="NOA" address="0x00009888" value="0x17908000" />
+        <register type="NOA" address="0x00009888" value="0x19908000" />
+        <register type="NOA" address="0x00009888" value="0x1B904000" />
+        <register type="NOA" address="0x00009888" value="0x1190C080" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x41900440" />
+        <register type="NOA" address="0x00009888" value="0x55900000" />
+        <register type="NOA" address="0x00009888" value="0x45900400" />
+        <register type="NOA" address="0x00009888" value="0x47900C21" />
+        <register type="NOA" address="0x00009888" value="0x57900400" />
+        <register type="NOA" address="0x00009888" value="0x49900042" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+        <register type="NOA" address="0x00009888" value="0x4B900024" />
+        <register type="NOA" address="0x00009888" value="0x59900000" />
+        <register type="NOA" address="0x00009888" value="0x43900841" />
+        <register type="NOA" address="0x00009888" value="0x53900400" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002724" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002770" value="0x0007FFEA" />
+        <register type="OA" address="0x00002774" value="0x00007FFC" />
+        <register type="OA" address="0x00002778" value="0x0007AFFA" />
+        <register type="OA" address="0x0000277C" value="0x0000F5FD" />
+        <register type="OA" address="0x00002780" value="0x00079FFA" />
+        <register type="OA" address="0x00002784" value="0x0000F3FB" />
+        <register type="OA" address="0x00002788" value="0x0007BF7A" />
+        <register type="OA" address="0x0000278C" value="0x0000F7E7" />
+        <register type="OA" address="0x00002790" value="0x0007FEFA" />
+        <register type="OA" address="0x00002794" value="0x0000F7CF" />
+        <register type="OA" address="0x00002798" value="0x00077FFA" />
+        <register type="OA" address="0x0000279C" value="0x0000EFDF" />
+        <register type="OA" address="0x000027A0" value="0x0006FFFA" />
+        <register type="OA" address="0x000027A4" value="0x0000CFBF" />
+        <register type="OA" address="0x000027A8" value="0x0003FFFA" />
+        <register type="OA" address="0x000027AC" value="0x00005F7F" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00015014" />
+        <register type="FLEX" address="0x0000E658" value="0x00025024" />
+        <register type="FLEX" address="0x0000E758" value="0x00035034" />
+        <register type="FLEX" address="0x0000E45C" value="0x00045044" />
+        <register type="FLEX" address="0x0000E55C" value="0x00055054" />
+        <register type="FLEX" address="0x0000E65C" value="0x00065064" />
+    </register_config>
+  </set>
+
+  <set name="Memory Reads Distribution Gen9"
+       mdapi_supported_apis="VK OGL OCL IO BB"
+       underscore_name="memory_reads"
+       hw_config_guid="96ec2219-040b-428a-856a-6bc03363a057"
+       chipset="KBLGT3"
+       symbol_name="MemoryReads"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GtiL3Bank0Reads"
+             description="The total number of GTI memory reads from L3 Bank 0 (L3 Cache misses)."
+             data_type="uint64"
+             equation="C 4 READ"
+             underscore_name="gti_l3_bank0_reads"
+             units="messages"
+             symbol_name="GtiL3Bank0Reads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/L3"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="GtiRingAccesses"
+             description="The total number of all accesses from GTI to the ring."
+             data_type="uint64"
+             equation="C 3 READ 2 UMUL"
+             underscore_name="gti_ring_accesses"
+             units="messages"
+             symbol_name="GtiRingAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="GtiL3Bank3Reads"
+             description="The total number of GTI memory reads from L3 Bank 3 (L3 Cache misses)."
+             data_type="uint64"
+             equation="C 7 READ"
+             underscore_name="gti_l3_bank3_reads"
+             units="messages"
+             symbol_name="GtiL3Bank3Reads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="GTI/L3"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="GtiRsMemoryReads"
+             description="The total number of GTI memory reads from Resource Streamer."
+             data_type="uint64"
+             equation="B 2 READ"
+             underscore_name="gti_rs_memory_reads"
+             units="messages"
+             symbol_name="GtiRsMemoryReads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/3D Pipe/Resource Streamer"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GtiHizMemoryReads"
+             description="The total number of GTI memory reads from Hierarchical Depth Cache (Hi-Depth Cache misses)."
+             data_type="uint64"
+             equation="B 5 READ"
+             underscore_name="gti_hiz_memory_reads"
+             units="messages"
+             symbol_name="GtiHizMemoryReads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Depth Cache"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="GtiRccMemoryReads"
+             description="The total number of GTI memory reads from Render Color Cache (Render Color Cache misses)."
+             data_type="uint64"
+             equation="B 3 READ"
+             underscore_name="gti_rcc_memory_reads"
+             units="messages"
+             symbol_name="GtiRccMemoryReads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Color Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GtiL3Bank1Reads"
+             description="The total number of GTI memory reads from L3 Bank 1 (L3 Cache misses)."
+             data_type="uint64"
+             equation="C 5 READ"
+             underscore_name="gti_l3_bank1_reads"
+             units="messages"
+             symbol_name="GtiL3Bank1Reads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="GTI/L3"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GtiCmdStreamerMemoryReads"
+             description="The total number of GTI memory reads from Command Streamer."
+             data_type="uint64"
+             equation="B 0 READ"
+             underscore_name="gti_cmd_streamer_memory_reads"
+             units="messages"
+             symbol_name="GtiCmdStreamerMemoryReads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/3D Pipe/Command Streamer"
+             />
+    <counter name="GtiL3Bank2Reads"
+             description="The total number of GTI memory reads from L3 Bank 2 (L3 Cache misses)."
+             data_type="uint64"
+             equation="C 6 READ"
+             underscore_name="gti_l3_bank2_reads"
+             units="messages"
+             symbol_name="GtiL3Bank2Reads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="GTI/L3"
+             />
+    <counter name="GtiMemoryReads"
+             description="The total number of GTI memory reads."
+             data_type="uint64"
+             equation="C 0 READ"
+             underscore_name="gti_memory_reads"
+             units="messages"
+             symbol_name="GtiMemoryReads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="GtiRczMemoryReads"
+             description="The total number of GTI memory reads from Render Depth Cache (Render Depth Cache misses)."
+             data_type="uint64"
+             equation="B 7 READ"
+             underscore_name="gti_rcz_memory_reads"
+             units="messages"
+             symbol_name="GtiRczMemoryReads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Depth Cache"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="GtiMscMemoryReads"
+             description="The total number of GTI memory reads from Multisampling Color Cache (Multisampling Color Cache misses)."
+             data_type="uint64"
+             equation="B 4 READ"
+             underscore_name="gti_msc_memory_reads"
+             units="messages"
+             symbol_name="GtiMscMemoryReads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Color Cache"
+             />
+    <counter name="GtiVfMemoryReads"
+             description="The total number of GTI memory reads from Vertex Fetch."
+             data_type="uint64"
+             equation="B 1 READ"
+             underscore_name="gti_vf_memory_reads"
+             units="messages"
+             symbol_name="GtiVfMemoryReads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/3D Pipe/Vertex Fetch"
+             />
+    <counter name="GtiStcMemoryReads"
+             description="The total number of GTI memory reads from Stencil Cache (Stencil Cache misses)."
+             data_type="uint64"
+             equation="B 6 READ"
+             underscore_name="gti_stc_memory_reads"
+             units="messages"
+             symbol_name="GtiStcMemoryReads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Depth Cache"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GtiL3Reads"
+             description="The total number of GTI memory reads from L3 (L3 Cache misses)."
+             data_type="uint64"
+             equation="$GtiL3Bank0Reads $GtiL3Bank1Reads $GtiL3Bank2Reads $GtiL3Bank3Reads UADD UADD UADD"
+             underscore_name="gti_l3_reads"
+             units="messages"
+             symbol_name="GtiL3Reads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/L3"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x11810C00" />
+        <register type="NOA" address="0x00009888" value="0x1381001A" />
+        <register type="NOA" address="0x00009888" value="0x37906800" />
+        <register type="NOA" address="0x00009888" value="0x3F900064" />
+        <register type="NOA" address="0x00009888" value="0x03811300" />
+        <register type="NOA" address="0x00009888" value="0x05811B12" />
+        <register type="NOA" address="0x00009888" value="0x0781001A" />
+        <register type="NOA" address="0x00009888" value="0x1F810000" />
+        <register type="NOA" address="0x00009888" value="0x17810000" />
+        <register type="NOA" address="0x00009888" value="0x19810000" />
+        <register type="NOA" address="0x00009888" value="0x1B810000" />
+        <register type="NOA" address="0x00009888" value="0x1D810000" />
+        <register type="NOA" address="0x00009888" value="0x1B930055" />
+        <register type="NOA" address="0x00009888" value="0x03E58000" />
+        <register type="NOA" address="0x00009888" value="0x05E5C000" />
+        <register type="NOA" address="0x00009888" value="0x07E54000" />
+        <register type="NOA" address="0x00009888" value="0x13900150" />
+        <register type="NOA" address="0x00009888" value="0x21900151" />
+        <register type="NOA" address="0x00009888" value="0x23900152" />
+        <register type="NOA" address="0x00009888" value="0x25900153" />
+        <register type="NOA" address="0x00009888" value="0x27900154" />
+        <register type="NOA" address="0x00009888" value="0x29900155" />
+        <register type="NOA" address="0x00009888" value="0x2B900156" />
+        <register type="NOA" address="0x00009888" value="0x2D900157" />
+        <register type="NOA" address="0x00009888" value="0x2F90015F" />
+        <register type="NOA" address="0x00009888" value="0x31900105" />
+        <register type="NOA" address="0x00009888" value="0x15900103" />
+        <register type="NOA" address="0x00009888" value="0x17900101" />
+        <register type="NOA" address="0x00009888" value="0x35900000" />
+        <register type="NOA" address="0x00009888" value="0x19908000" />
+        <register type="NOA" address="0x00009888" value="0x1B908000" />
+        <register type="NOA" address="0x00009888" value="0x1D908000" />
+        <register type="NOA" address="0x00009888" value="0x1F908000" />
+        <register type="NOA" address="0x00009888" value="0x11900000" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x41900C60" />
+        <register type="NOA" address="0x00009888" value="0x55900000" />
+        <register type="NOA" address="0x00009888" value="0x45900C00" />
+        <register type="NOA" address="0x00009888" value="0x47900C63" />
+        <register type="NOA" address="0x00009888" value="0x57900000" />
+        <register type="NOA" address="0x00009888" value="0x49900C63" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+        <register type="NOA" address="0x00009888" value="0x4B900063" />
+        <register type="NOA" address="0x00009888" value="0x59900000" />
+        <register type="NOA" address="0x00009888" value="0x43900003" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x0000272C" value="0xFFFFFFFF" />
+        <register type="OA" address="0x00002728" value="0xFFFFFFFF" />
+        <register type="OA" address="0x00002724" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x0000271C" value="0xFFFFFFFF" />
+        <register type="OA" address="0x00002718" value="0xFFFFFFFF" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x0000274C" value="0x86543210" />
+        <register type="OA" address="0x00002748" value="0x86543210" />
+        <register type="OA" address="0x00002744" value="0x00006667" />
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x0000275C" value="0x86543210" />
+        <register type="OA" address="0x00002758" value="0x86543210" />
+        <register type="OA" address="0x00002754" value="0x00006465" />
+        <register type="OA" address="0x00002750" value="0x00000000" />
+        <register type="OA" address="0x00002770" value="0x0007F81A" />
+        <register type="OA" address="0x00002774" value="0x0000FE00" />
+        <register type="OA" address="0x00002778" value="0x0007F82A" />
+        <register type="OA" address="0x0000277C" value="0x0000FE00" />
+        <register type="OA" address="0x00002780" value="0x0007F872" />
+        <register type="OA" address="0x00002784" value="0x0000FE00" />
+        <register type="OA" address="0x00002788" value="0x0007F8BA" />
+        <register type="OA" address="0x0000278C" value="0x0000FE00" />
+        <register type="OA" address="0x00002790" value="0x0007F87A" />
+        <register type="OA" address="0x00002794" value="0x0000FE00" />
+        <register type="OA" address="0x00002798" value="0x0007F8EA" />
+        <register type="OA" address="0x0000279C" value="0x0000FE00" />
+        <register type="OA" address="0x000027A0" value="0x0007F8E2" />
+        <register type="OA" address="0x000027A4" value="0x0000FE00" />
+        <register type="OA" address="0x000027A8" value="0x0007F8F2" />
+        <register type="OA" address="0x000027AC" value="0x0000FE00" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00015014" />
+        <register type="FLEX" address="0x0000E658" value="0x00025024" />
+        <register type="FLEX" address="0x0000E758" value="0x00035034" />
+        <register type="FLEX" address="0x0000E45C" value="0x00045044" />
+        <register type="FLEX" address="0x0000E55C" value="0x00055054" />
+        <register type="FLEX" address="0x0000E65C" value="0x00065064" />
+    </register_config>
+  </set>
+
+  <set name="Memory Writes Distribution Gen9"
+       mdapi_supported_apis="VK OGL OCL IO BB"
+       underscore_name="memory_writes"
+       hw_config_guid="03372b64-4996-4d3b-aa18-790e75eeb9c2"
+       chipset="KBLGT3"
+       symbol_name="MemoryWrites"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GtiMemoryWrites"
+             description="The total number of GTI memory writes."
+             data_type="uint64"
+             equation="C 0 READ"
+             underscore_name="gti_memory_writes"
+             units="messages"
+             symbol_name="GtiMemoryWrites"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="GtiRingAccesses"
+             description="The total number of all GTI accesses to the ring."
+             data_type="uint64"
+             equation="C 3 READ 2 UMUL"
+             underscore_name="gti_ring_accesses"
+             units="messages"
+             symbol_name="GtiRingAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="GtiMscMemoryWrites"
+             description="The total number of GTI memory writes from Multisampling Color Cache (Multisampling Color Cache invalidations)."
+             data_type="uint64"
+             equation="B 4 READ"
+             underscore_name="gti_msc_memory_writes"
+             units="messages"
+             symbol_name="GtiMscMemoryWrites"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Color Cache"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="GtiCmdStreamerMemoryWrites"
+             description="The total number of GTI memory writes from Command Streamer."
+             data_type="uint64"
+             equation="B 0 READ"
+             underscore_name="gti_cmd_streamer_memory_writes"
+             units="messages"
+             symbol_name="GtiCmdStreamerMemoryWrites"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/3D Pipe/Command Streamer"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GtiL3Bank0Writes"
+             description="The total number of GTI memory writes from L3 Bank 0 (L3 Bank 0 invalidations)."
+             data_type="uint64"
+             equation="C 4 READ"
+             underscore_name="gti_l3_bank0_writes"
+             units="messages"
+             symbol_name="GtiL3Bank0Writes"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/L3"
+             />
+    <counter name="GtiL3Bank1Writes"
+             description="The total number of GTI memory writes from L3 Bank 1 (L3 Bank 1 invalidations)."
+             data_type="uint64"
+             equation="C 5 READ"
+             underscore_name="gti_l3_bank1_writes"
+             units="messages"
+             symbol_name="GtiL3Bank1Writes"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/L3"
+             />
+    <counter name="GtiL3Bank2Writes"
+             description="The total number of GTI memory writes from L3 Bank 2 (L3 Bank 2 invalidations)."
+             data_type="uint64"
+             equation="C 6 READ"
+             underscore_name="gti_l3_bank2_writes"
+             units="messages"
+             symbol_name="GtiL3Bank2Writes"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/L3"
+             />
+    <counter name="GtiL3Bank3Writes"
+             description="The total number of GTI memory writes from L3 Bank 3 (L3 Bank 3 invalidations)."
+             data_type="uint64"
+             equation="C 7 READ"
+             underscore_name="gti_l3_bank3_writes"
+             units="messages"
+             symbol_name="GtiL3Bank3Writes"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/L3"
+             />
+    <counter name="GtiL3Writes"
+             description="The total number of GTI memory writes from L3 (L3 invalidations)."
+             data_type="uint64"
+             equation="$GtiL3Bank0Writes $GtiL3Bank1Writes $GtiL3Bank2Writes $GtiL3Bank3Writes UADD UADD UADD"
+             underscore_name="gti_l3_writes"
+             units="messages"
+             symbol_name="GtiL3Writes"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/L3"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GtiRccMemoryWrites"
+             description="The total number of GTI memory writes from Render Color Cache (Render Color Cache invalidations)."
+             data_type="uint64"
+             equation="B 3 READ"
+             underscore_name="gti_rcc_memory_writes"
+             units="messages"
+             symbol_name="GtiRccMemoryWrites"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Color Cache"
+             />
+    <counter name="GtiSoMemoryWrites"
+             description="The total number of GTI memory writes from Stream Output."
+             data_type="uint64"
+             equation="B 2 READ"
+             underscore_name="gti_so_memory_writes"
+             units="messages"
+             symbol_name="GtiSoMemoryWrites"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/3D Pipe/Stream Output"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GtiStcMemoryWrites"
+             description="The total number of GTI memory writes from Stencil Cache."
+             data_type="uint64"
+             equation="B 6 READ"
+             underscore_name="gti_stc_memory_writes"
+             units="messages"
+             symbol_name="GtiStcMemoryWrites"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Depth Cache"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="GtiRczMemoryWrites"
+             description="The total number of GTI memory writes from Render Depth Cache."
+             data_type="uint64"
+             equation="B 7 READ"
+             underscore_name="gti_rcz_memory_writes"
+             units="messages"
+             symbol_name="GtiRczMemoryWrites"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Depth Cache"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="GtiHizMemoryWrites"
+             description="The total number of GTI memory writes from Hierarchical Depth Cache."
+             data_type="uint64"
+             equation="B 5 READ"
+             underscore_name="gti_hiz_memory_writes"
+             units="messages"
+             symbol_name="GtiHizMemoryWrites"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Depth Cache"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x11810C00" />
+        <register type="NOA" address="0x00009888" value="0x1381001A" />
+        <register type="NOA" address="0x00009888" value="0x37906800" />
+        <register type="NOA" address="0x00009888" value="0x3F901000" />
+        <register type="NOA" address="0x00009888" value="0x03811300" />
+        <register type="NOA" address="0x00009888" value="0x05811B12" />
+        <register type="NOA" address="0x00009888" value="0x0781001A" />
+        <register type="NOA" address="0x00009888" value="0x1F810000" />
+        <register type="NOA" address="0x00009888" value="0x17810000" />
+        <register type="NOA" address="0x00009888" value="0x19810000" />
+        <register type="NOA" address="0x00009888" value="0x1B810000" />
+        <register type="NOA" address="0x00009888" value="0x1D810000" />
+        <register type="NOA" address="0x00009888" value="0x1B930055" />
+        <register type="NOA" address="0x00009888" value="0x03E58000" />
+        <register type="NOA" address="0x00009888" value="0x05E5C000" />
+        <register type="NOA" address="0x00009888" value="0x07E54000" />
+        <register type="NOA" address="0x00009888" value="0x13900160" />
+        <register type="NOA" address="0x00009888" value="0x21900161" />
+        <register type="NOA" address="0x00009888" value="0x23900162" />
+        <register type="NOA" address="0x00009888" value="0x25900163" />
+        <register type="NOA" address="0x00009888" value="0x27900164" />
+        <register type="NOA" address="0x00009888" value="0x29900165" />
+        <register type="NOA" address="0x00009888" value="0x2B900166" />
+        <register type="NOA" address="0x00009888" value="0x2D900167" />
+        <register type="NOA" address="0x00009888" value="0x2F900150" />
+        <register type="NOA" address="0x00009888" value="0x31900105" />
+        <register type="NOA" address="0x00009888" value="0x15900103" />
+        <register type="NOA" address="0x00009888" value="0x17900101" />
+        <register type="NOA" address="0x00009888" value="0x35900000" />
+        <register type="NOA" address="0x00009888" value="0x19908000" />
+        <register type="NOA" address="0x00009888" value="0x1B908000" />
+        <register type="NOA" address="0x00009888" value="0x1D908000" />
+        <register type="NOA" address="0x00009888" value="0x1F908000" />
+        <register type="NOA" address="0x00009888" value="0x11900000" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x41900C60" />
+        <register type="NOA" address="0x00009888" value="0x55900000" />
+        <register type="NOA" address="0x00009888" value="0x45900C00" />
+        <register type="NOA" address="0x00009888" value="0x47900C63" />
+        <register type="NOA" address="0x00009888" value="0x57900000" />
+        <register type="NOA" address="0x00009888" value="0x49900C63" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+        <register type="NOA" address="0x00009888" value="0x4B900063" />
+        <register type="NOA" address="0x00009888" value="0x59900000" />
+        <register type="NOA" address="0x00009888" value="0x43900003" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x0000272C" value="0xFFFFFFFF" />
+        <register type="OA" address="0x00002728" value="0xFFFFFFFF" />
+        <register type="OA" address="0x00002724" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x0000271C" value="0xFFFFFFFF" />
+        <register type="OA" address="0x00002718" value="0xFFFFFFFF" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x0000274C" value="0x86543210" />
+        <register type="OA" address="0x00002748" value="0x86543210" />
+        <register type="OA" address="0x00002744" value="0x00006667" />
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x0000275C" value="0x86543210" />
+        <register type="OA" address="0x00002758" value="0x86543210" />
+        <register type="OA" address="0x00002754" value="0x00006465" />
+        <register type="OA" address="0x00002750" value="0x00000000" />
+        <register type="OA" address="0x00002770" value="0x0007F81A" />
+        <register type="OA" address="0x00002774" value="0x0000FE00" />
+        <register type="OA" address="0x00002778" value="0x0007F82A" />
+        <register type="OA" address="0x0000277C" value="0x0000FE00" />
+        <register type="OA" address="0x00002780" value="0x0007F822" />
+        <register type="OA" address="0x00002784" value="0x0000FE00" />
+        <register type="OA" address="0x00002788" value="0x0007F8BA" />
+        <register type="OA" address="0x0000278C" value="0x0000FE00" />
+        <register type="OA" address="0x00002790" value="0x0007F87A" />
+        <register type="OA" address="0x00002794" value="0x0000FE00" />
+        <register type="OA" address="0x00002798" value="0x0007F8EA" />
+        <register type="OA" address="0x0000279C" value="0x0000FE00" />
+        <register type="OA" address="0x000027A0" value="0x0007F8E2" />
+        <register type="OA" address="0x000027A4" value="0x0000FE00" />
+        <register type="OA" address="0x000027A8" value="0x0007F8F2" />
+        <register type="OA" address="0x000027AC" value="0x0000FE00" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00015014" />
+        <register type="FLEX" address="0x0000E658" value="0x00025024" />
+        <register type="FLEX" address="0x0000E758" value="0x00035034" />
+        <register type="FLEX" address="0x0000E45C" value="0x00045044" />
+        <register type="FLEX" address="0x0000E55C" value="0x00055054" />
+        <register type="FLEX" address="0x0000E65C" value="0x00065064" />
+    </register_config>
+  </set>
+
+  <set name="Compute Metrics Extended Gen9"
+       mdapi_supported_apis="VK OGL4 OCL IO BB"
+       underscore_name="compute_extended"
+       hw_config_guid="31b4ce5a-bd61-4c1f-bb5d-f2e731412150"
+       chipset="KBLGT3"
+       symbol_name="ComputeExtended"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="fpu0_active"
+             units="percent"
+             symbol_name="Fpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="fpu1_active"
+             units="percent"
+             symbol_name="Fpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU AVG IPC Rate"
+             description="The average rate of IPC calculated for 2 FPU pipelines."
+             data_type="float"
+             max_equation="2"
+             equation="A 9 READ  A 10 READ  A 11 READ UADD  A 9 READ USUB FDIV 1 FADD"
+             underscore_name="eu_avg_ipc_rate"
+             units="number"
+             symbol_name="EuAvgIpcRate"
+             semantic_type="ratio"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Typed Writes 0"
+             description="The subslice 0 typed writes."
+             data_type="uint64"
+             equation="C 0 READ"
+             underscore_name="typed_writes0"
+             units="messages"
+             symbol_name="TypedWrites0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="EuTypedAtomics0"
+             description="The subslice 0 EU Typed Atomics subslice 0."
+             data_type="uint64"
+             equation="B 5 READ"
+             underscore_name="eu_typed_atomics0"
+             units="messages"
+             symbol_name="EuTypedAtomics0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="Typed Atomics 0"
+             description="The subslice 0 typed atomics."
+             data_type="uint64"
+             equation="C 4 READ"
+             underscore_name="typed_atomics0"
+             units="messages"
+             symbol_name="TypedAtomics0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="TypedAtomicsPerCacheLine"
+             description="The ratio of EU typed atomics requests to L3 cache line writes."
+             data_type="float"
+             equation="$EuTypedAtomics0 $TypedAtomics0 FDIV"
+             underscore_name="typed_atomics_per_cache_line"
+             units="eu sends to l3 cache lines"
+             symbol_name="TypedAtomicsPerCacheLine"
+             semantic_type="ratio"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="EuUntypedReads0"
+             description="The subslice 0 EU Untyped Reads subslice 0."
+             data_type="uint64"
+             equation="B 0 READ"
+             underscore_name="eu_untyped_reads0"
+             units="messages"
+             symbol_name="EuUntypedReads0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="Untyped Writes 0"
+             description="The subslice 0 untyped writes (including SLM writes)."
+             data_type="uint64"
+             equation="C 1 READ"
+             underscore_name="untyped_writes0"
+             units="messages"
+             symbol_name="UntypedWrites0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="EuUntypedAtomics0"
+             description="The subslice 0 EU Untyped Atomics subslice 0."
+             data_type="uint64"
+             equation="B 4 READ"
+             underscore_name="eu_untyped_atomics0"
+             units="messages"
+             symbol_name="EuUntypedAtomics0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="EuUntypedWrites0"
+             description="The subslice 0 EU Untyped Writes subslice 0."
+             data_type="uint64"
+             equation="B 1 READ"
+             underscore_name="eu_untyped_writes0"
+             units="messages"
+             symbol_name="EuUntypedWrites0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="EuA64UntypedWrites0"
+             description="The subslice 0 EU A64 Untyped Writes subslice 0."
+             data_type="uint64"
+             equation="B 7 READ"
+             underscore_name="eu_a64_untyped_writes0"
+             units="messages"
+             symbol_name="EuA64UntypedWrites0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="UntypedWritesPerCacheLine"
+             description="The ratio of EU untyped write requests to L3 cache line writes."
+             data_type="float"
+             equation="$EuUntypedWrites0 $EuA64UntypedWrites0 UADD $UntypedWrites0 FDIV"
+             underscore_name="untyped_writes_per_cache_line"
+             units="eu sends to l3 cache lines"
+             symbol_name="UntypedWritesPerCacheLine"
+             semantic_type="ratio"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EuTypedWrites0"
+             description="The subslice 0 EU Typed Writes subslice 0."
+             data_type="uint64"
+             equation="B 3 READ"
+             underscore_name="eu_typed_writes0"
+             units="messages"
+             symbol_name="EuTypedWrites0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="TypedWritesPerCacheLine"
+             description="The ratio of EU typed write requests to L3 cache line writes."
+             data_type="float"
+             equation="$EuTypedWrites0 $TypedWrites0 FDIV"
+             underscore_name="typed_writes_per_cache_line"
+             units="eu sends to l3 cache lines"
+             symbol_name="TypedWritesPerCacheLine"
+             semantic_type="ratio"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="Typed Reads 0"
+             description="The subslice 0 typed reads."
+             data_type="uint64"
+             equation="C 2 READ"
+             underscore_name="typed_reads0"
+             units="messages"
+             symbol_name="TypedReads0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="Untyped Reads 0"
+             description="The subslice 0 untyped reads (including SLM reads)."
+             data_type="uint64"
+             equation="C 3 READ"
+             underscore_name="untyped_reads0"
+             units="messages"
+             symbol_name="UntypedReads0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="EuA64UntypedReads0"
+             description="The subslice 0 EU A64 Untyped Reads subslice 0."
+             data_type="uint64"
+             equation="B 6 READ"
+             underscore_name="eu_a64_untyped_reads0"
+             units="messages"
+             symbol_name="EuA64UntypedReads0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="EU Thread Occupancy"
+             description="The percentage of time in which hardware threads occupied EUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 13 READ 8 UMUL $EuCoresTotalCount UDIV $EuThreadsCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_thread_occupancy"
+             units="percent"
+             symbol_name="EuThreadOccupancy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EuTypedReads0"
+             description="The subslice 0 EU Typed Reads subslice 0."
+             data_type="uint64"
+             equation="B 2 READ"
+             underscore_name="eu_typed_reads0"
+             units="messages"
+             symbol_name="EuTypedReads0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="UntypedReadsPerCacheLine"
+             description="The ratio of EU untyped read requests to L3 cache line reads."
+             data_type="float"
+             equation="$EuUntypedReads0 $EuA64UntypedReads0 UADD $UntypedReads0 FDIV"
+             underscore_name="untyped_reads_per_cache_line"
+             units="eu sends to l3 cache lines"
+             symbol_name="UntypedReadsPerCacheLine"
+             semantic_type="ratio"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="TypedReadsPerCacheLine"
+             description="The ratio of EU typed read requests to L3 cache line reads."
+             data_type="float"
+             equation="$EuTypedReads0 $TypedReads0 FDIV"
+             underscore_name="typed_reads_per_cache_line"
+             units="eu sends to l3 cache lines"
+             symbol_name="TypedReadsPerCacheLine"
+             semantic_type="ratio"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <counter name="EU Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_send_active"
+             units="percent"
+             symbol_name="EuSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x106C00E0" />
+        <register type="NOA" address="0x00009888" value="0x141C8160" />
+        <register type="NOA" address="0x00009888" value="0x161C8015" />
+        <register type="NOA" address="0x00009888" value="0x181C0120" />
+        <register type="NOA" address="0x00009888" value="0x004E8000" />
+        <register type="NOA" address="0x00009888" value="0x0E4E8000" />
+        <register type="NOA" address="0x00009888" value="0x184E8000" />
+        <register type="NOA" address="0x00009888" value="0x1A4EAAA0" />
+        <register type="NOA" address="0x00009888" value="0x1C4E0002" />
+        <register type="NOA" address="0x00009888" value="0x024E8000" />
+        <register type="NOA" address="0x00009888" value="0x044E8000" />
+        <register type="NOA" address="0x00009888" value="0x064E8000" />
+        <register type="NOA" address="0x00009888" value="0x084E8000" />
+        <register type="NOA" address="0x00009888" value="0x0A4E8000" />
+        <register type="NOA" address="0x00009888" value="0x0E6C0B01" />
+        <register type="NOA" address="0x00009888" value="0x006C0200" />
+        <register type="NOA" address="0x00009888" value="0x026C000C" />
+        <register type="NOA" address="0x00009888" value="0x1C6C0000" />
+        <register type="NOA" address="0x00009888" value="0x1E6C0000" />
+        <register type="NOA" address="0x00009888" value="0x1A6C0000" />
+        <register type="NOA" address="0x00009888" value="0x0E1BC000" />
+        <register type="NOA" address="0x00009888" value="0x001B8000" />
+        <register type="NOA" address="0x00009888" value="0x021BC000" />
+        <register type="NOA" address="0x00009888" value="0x001C0041" />
+        <register type="NOA" address="0x00009888" value="0x061C4200" />
+        <register type="NOA" address="0x00009888" value="0x081C4443" />
+        <register type="NOA" address="0x00009888" value="0x0A1C4645" />
+        <register type="NOA" address="0x00009888" value="0x0C1C7647" />
+        <register type="NOA" address="0x00009888" value="0x041C7357" />
+        <register type="NOA" address="0x00009888" value="0x1C1C0030" />
+        <register type="NOA" address="0x00009888" value="0x101C0000" />
+        <register type="NOA" address="0x00009888" value="0x1A1C0000" />
+        <register type="NOA" address="0x00009888" value="0x121C8000" />
+        <register type="NOA" address="0x00009888" value="0x004C8000" />
+        <register type="NOA" address="0x00009888" value="0x0A4CAA2A" />
+        <register type="NOA" address="0x00009888" value="0x0C4C02AA" />
+        <register type="NOA" address="0x00009888" value="0x084CA000" />
+        <register type="NOA" address="0x00009888" value="0x000DA000" />
+        <register type="NOA" address="0x00009888" value="0x060D8000" />
+        <register type="NOA" address="0x00009888" value="0x080DA000" />
+        <register type="NOA" address="0x00009888" value="0x0A0DA000" />
+        <register type="NOA" address="0x00009888" value="0x0C0DA000" />
+        <register type="NOA" address="0x00009888" value="0x0E0DA000" />
+        <register type="NOA" address="0x00009888" value="0x020DA000" />
+        <register type="NOA" address="0x00009888" value="0x040DA000" />
+        <register type="NOA" address="0x00009888" value="0x0C0F5400" />
+        <register type="NOA" address="0x00009888" value="0x0E0F5515" />
+        <register type="NOA" address="0x00009888" value="0x100F0155" />
+        <register type="NOA" address="0x00009888" value="0x002C8000" />
+        <register type="NOA" address="0x00009888" value="0x0E2C8000" />
+        <register type="NOA" address="0x00009888" value="0x162CAA00" />
+        <register type="NOA" address="0x00009888" value="0x182C00AA" />
+        <register type="NOA" address="0x00009888" value="0x022C8000" />
+        <register type="NOA" address="0x00009888" value="0x042C8000" />
+        <register type="NOA" address="0x00009888" value="0x062C8000" />
+        <register type="NOA" address="0x00009888" value="0x082C8000" />
+        <register type="NOA" address="0x00009888" value="0x0A2C8000" />
+        <register type="NOA" address="0x00009888" value="0x11907FFF" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x41900040" />
+        <register type="NOA" address="0x00009888" value="0x55900000" />
+        <register type="NOA" address="0x00009888" value="0x45900802" />
+        <register type="NOA" address="0x00009888" value="0x47900842" />
+        <register type="NOA" address="0x00009888" value="0x57900000" />
+        <register type="NOA" address="0x00009888" value="0x49900842" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+        <register type="NOA" address="0x00009888" value="0x4B900000" />
+        <register type="NOA" address="0x00009888" value="0x59900000" />
+        <register type="NOA" address="0x00009888" value="0x43900800" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002724" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002770" value="0x0007FC2A" />
+        <register type="OA" address="0x00002774" value="0x0000BF00" />
+        <register type="OA" address="0x00002778" value="0x0007FC6A" />
+        <register type="OA" address="0x0000277C" value="0x0000BF00" />
+        <register type="OA" address="0x00002780" value="0x0007FC92" />
+        <register type="OA" address="0x00002784" value="0x0000BF00" />
+        <register type="OA" address="0x00002788" value="0x0007FCA2" />
+        <register type="OA" address="0x0000278C" value="0x0000BF00" />
+        <register type="OA" address="0x00002790" value="0x0007FC32" />
+        <register type="OA" address="0x00002794" value="0x0000BF00" />
+        <register type="OA" address="0x00002798" value="0x0007FC9A" />
+        <register type="OA" address="0x0000279C" value="0x0000BF00" />
+        <register type="OA" address="0x000027A0" value="0x0007FE6A" />
+        <register type="OA" address="0x000027A4" value="0x0000BF00" />
+        <register type="OA" address="0x000027A8" value="0x0007FE7A" />
+        <register type="OA" address="0x000027AC" value="0x0000BF00" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00000003" />
+        <register type="FLEX" address="0x0000E658" value="0x00002001" />
+        <register type="FLEX" address="0x0000E758" value="0x00778008" />
+        <register type="FLEX" address="0x0000E45C" value="0x00088078" />
+        <register type="FLEX" address="0x0000E55C" value="0x00808708" />
+        <register type="FLEX" address="0x0000E65C" value="0x00A08908" />
+    </register_config>
+  </set>
+
+  <set name="Compute Metrics L3 Cache Gen9"
+       mdapi_supported_apis="VK OGL4 OCL IO BB"
+       underscore_name="compute_l3_cache"
+       hw_config_guid="2ce0911a-27fc-4887-96f0-11084fa807c3"
+       chipset="KBLGT3"
+       symbol_name="ComputeL3Cache"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Bank 03 Accesses"
+             description="The total number of accesses to L3 Bank 03."
+             data_type="uint64"
+             equation="B 3 READ 2 UMUL"
+             underscore_name="l3_bank03_accesses"
+             units="messages"
+             symbol_name="L3Bank03Accesses"
+             availability="$SliceMask 0x01 AND"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="slice"
+             mdapi_group="L3"
+             />
+    <counter name="L3 Accesses"
+             description="The total number of L3 accesses from all entities."
+             data_type="uint64"
+             equation="C 0 READ C 1 READ B 2 READ B 3 READ UADD UADD UADD 2 UMUL"
+             underscore_name="l3_accesses"
+             units="messages"
+             symbol_name="L3Accesses"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Sampler Throughput"
+             description="The total number of GPU memory bytes transferred between samplers and L3 caches."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="A 29 READ 64 UMUL"
+             underscore_name="l3_sampler_throughput"
+             units="bytes"
+             symbol_name="L3SamplerThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Sampler"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="fpu0_active"
+             units="percent"
+             symbol_name="Fpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="fpu1_active"
+             units="percent"
+             symbol_name="Fpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU AVG IPC Rate"
+             description="The average rate of IPC calculated for 2 FPU pipelines."
+             data_type="float"
+             max_equation="2"
+             equation="A 9 READ  A 10 READ  A 11 READ UADD  A 9 READ USUB FDIV 1 FADD"
+             underscore_name="eu_avg_ipc_rate"
+             units="number"
+             symbol_name="EuAvgIpcRate"
+             semantic_type="ratio"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier4 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU0 Binary Instruction"
+             description="The percentage of time in which execution units were actively processing binary instructions on FPU0."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_binary_fpu0_instruction"
+             units="percent"
+             symbol_name="EuBinaryFpu0Instruction"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes/Instructions"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="EU FPU0 Hybrid Instruction"
+             description="The percentage of time in which execution units were actively processing hybrid instructions on FPU0."
+             data_type="float"
+             max_equation="100"
+             equation="A 13 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_hybrid_fpu0_instruction"
+             units="percent"
+             symbol_name="EuHybridFpu0Instruction"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="EU Array/Pipes/Instructions"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Misses"
+             description="The total number of L3 misses."
+             data_type="uint64"
+             equation="C 4 READ C 5 READ UADD"
+             underscore_name="l3_misses"
+             units="messages"
+             symbol_name="L3Misses"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/TAG"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="L3 Bank 00 Accesses"
+             description="The total number of accesses to L3 Bank 00."
+             data_type="uint64"
+             equation="C 0 READ 2 UMUL"
+             underscore_name="l3_bank00_accesses"
+             units="messages"
+             symbol_name="L3Bank00Accesses"
+             availability="$SliceMask 0x01 AND"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="slice"
+             mdapi_group="L3"
+             />
+    <counter name="EU FPU0 Move Instruction"
+             description="The percentage of time in which execution units were actively processing move instructions on FPU0."
+             data_type="float"
+             max_equation="100"
+             equation="A 19 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_move_fpu0_instruction"
+             units="percent"
+             symbol_name="EuMoveFpu0Instruction"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes/Instructions"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU FPU1 Hybrid Instruction"
+             description="The percentage of time in which execution units were actively processing hybrid instructions on FPU1."
+             data_type="float"
+             max_equation="100"
+             equation="A 14 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_hybrid_fpu1_instruction"
+             units="percent"
+             symbol_name="EuHybridFpu1Instruction"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="EU Array/Pipes/Instructions"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texel lookups (with 2x2 accuracy) that missed the L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GTI Read Throughput"
+             description="The total number of GPU memory bytes read from GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL"
+             equation="C 6 READ 64 UMUL"
+             underscore_name="gti_read_throughput"
+             units="bytes"
+             symbol_name="GtiReadThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GTI L3 Throughput"
+             description="The total number of GPU memory bytes transferred between L3 caches and GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="C 4 READ C 5 READ UADD 64 UMUL"
+             underscore_name="gti_l3_throughput"
+             units="bytes"
+             symbol_name="GtiL3Throughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Bank 00 IC Accesses"
+             description="The total number of accesses to L3 Bank 00 from IC cache."
+             data_type="uint64"
+             equation="B 0 READ B 1 READ UADD 2 UMUL $L3Bank00Accesses UMIN"
+             underscore_name="l3_bank00_ic_accesses"
+             units="messages"
+             symbol_name="L3Bank00IcAccesses"
+             availability="$SliceMask 0x01 AND"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="slice"
+             mdapi_group="L3/IC"
+             />
+    <counter name="L3 Bank 00 IC Hits"
+             description="The total number of hits in L3 Bank 00 from IC cache."
+             data_type="uint64"
+             equation="B 1 READ 2 UMUL $L3Bank00IcAccesses UMIN"
+             underscore_name="l3_bank00_ic_hits"
+             units="messages"
+             symbol_name="L3Bank00IcHits"
+             availability="$SliceMask 0x01 AND"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="slice"
+             mdapi_group="L3/IC"
+             />
+    <counter name="Sampler Accesses"
+             description="The total number of messages sent to samplers."
+             data_type="uint64"
+             equation="A 28 READ"
+             underscore_name="sampler_accesses"
+             units="messages"
+             symbol_name="SamplerAccesses"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler"
+             />
+    <counter name="L3 Bank 01 Accesses"
+             description="The total number of accesses to L3 Bank 01."
+             data_type="uint64"
+             equation="C 1 READ 2 UMUL"
+             underscore_name="l3_bank01_accesses"
+             units="messages"
+             symbol_name="L3Bank01Accesses"
+             availability="$SliceMask 0x01 AND"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="slice"
+             mdapi_group="L3"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU0 Ternary Instruction"
+             description="The percentage of time in which execution units were actively processing ternary instructions on FPU0."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_ternary_fpu0_instruction"
+             units="percent"
+             symbol_name="EuTernaryFpu0Instruction"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes/Instructions"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU FPU1 Move Instruction"
+             description="The percentage of time in which execution units were actively processing move instructions on FPU1."
+             data_type="float"
+             max_equation="100"
+             equation="A 20 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_move_fpu1_instruction"
+             units="percent"
+             symbol_name="EuMoveFpu1Instruction"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes/Instructions"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="L3 Bank 02 Accesses"
+             description="The total number of accesses to L3 Bank 02."
+             data_type="uint64"
+             equation="B 2 READ 2 UMUL"
+             underscore_name="l3_bank02_accesses"
+             units="messages"
+             symbol_name="L3Bank02Accesses"
+             availability="$SliceMask 0x01 AND"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="slice"
+             mdapi_group="L3"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="L3 Total Throughput"
+             description="The total number of GPU memory bytes transferred via L3."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="$L3Accesses 64 UMUL"
+             underscore_name="l3_total_throughput"
+             units="bytes"
+             symbol_name="L3TotalThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GTI Write Throughput"
+             description="The total number of GPU memory bytes written to GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 32 UMUL"
+             equation="C 7 READ 64 UMUL"
+             underscore_name="gti_write_throughput"
+             units="bytes"
+             symbol_name="GtiWriteThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="EU FPU1 Binary Instruction"
+             description="The percentage of time in which execution units were actively processing binary instructions on FPU1."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_binary_fpu1_instruction"
+             units="percent"
+             symbol_name="EuBinaryFpu1Instruction"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes/Instructions"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU1 Ternary Instruction"
+             description="The percentage of time in which execution units were actively processing ternary instructions on FPU1."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_ternary_fpu1_instruction"
+             units="percent"
+             symbol_name="EuTernaryFpu1Instruction"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes/Instructions"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_send_active"
+             units="percent"
+             symbol_name="EuSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x166C0760" />
+        <register type="NOA" address="0x00009888" value="0x1593001E" />
+        <register type="NOA" address="0x00009888" value="0x3F900003" />
+        <register type="NOA" address="0x00009888" value="0x004E8000" />
+        <register type="NOA" address="0x00009888" value="0x0E4E8000" />
+        <register type="NOA" address="0x00009888" value="0x184E8000" />
+        <register type="NOA" address="0x00009888" value="0x1A4E8020" />
+        <register type="NOA" address="0x00009888" value="0x1C4E0002" />
+        <register type="NOA" address="0x00009888" value="0x006C0051" />
+        <register type="NOA" address="0x00009888" value="0x066C5000" />
+        <register type="NOA" address="0x00009888" value="0x086C5C5D" />
+        <register type="NOA" address="0x00009888" value="0x0E6C5E5F" />
+        <register type="NOA" address="0x00009888" value="0x106C0000" />
+        <register type="NOA" address="0x00009888" value="0x186C0000" />
+        <register type="NOA" address="0x00009888" value="0x1C6C0000" />
+        <register type="NOA" address="0x00009888" value="0x1E6C0000" />
+        <register type="NOA" address="0x00009888" value="0x001B4000" />
+        <register type="NOA" address="0x00009888" value="0x061B8000" />
+        <register type="NOA" address="0x00009888" value="0x081BC000" />
+        <register type="NOA" address="0x00009888" value="0x0E1BC000" />
+        <register type="NOA" address="0x00009888" value="0x101C8000" />
+        <register type="NOA" address="0x00009888" value="0x1A1CE000" />
+        <register type="NOA" address="0x00009888" value="0x1C1C0030" />
+        <register type="NOA" address="0x00009888" value="0x004C8000" />
+        <register type="NOA" address="0x00009888" value="0x0A4C2A00" />
+        <register type="NOA" address="0x00009888" value="0x0C4C0280" />
+        <register type="NOA" address="0x00009888" value="0x000D2000" />
+        <register type="NOA" address="0x00009888" value="0x060D8000" />
+        <register type="NOA" address="0x00009888" value="0x080DA000" />
+        <register type="NOA" address="0x00009888" value="0x0E0DA000" />
+        <register type="NOA" address="0x00009888" value="0x0C0F0400" />
+        <register type="NOA" address="0x00009888" value="0x0E0F1500" />
+        <register type="NOA" address="0x00009888" value="0x100F0140" />
+        <register type="NOA" address="0x00009888" value="0x002C8000" />
+        <register type="NOA" address="0x00009888" value="0x0E2C8000" />
+        <register type="NOA" address="0x00009888" value="0x162C0A00" />
+        <register type="NOA" address="0x00009888" value="0x182C00A0" />
+        <register type="NOA" address="0x00009888" value="0x03933300" />
+        <register type="NOA" address="0x00009888" value="0x05930032" />
+        <register type="NOA" address="0x00009888" value="0x11930000" />
+        <register type="NOA" address="0x00009888" value="0x1B930000" />
+        <register type="NOA" address="0x00009888" value="0x1D900157" />
+        <register type="NOA" address="0x00009888" value="0x1F900158" />
+        <register type="NOA" address="0x00009888" value="0x35900000" />
+        <register type="NOA" address="0x00009888" value="0x19908000" />
+        <register type="NOA" address="0x00009888" value="0x1B908000" />
+        <register type="NOA" address="0x00009888" value="0x1190030F" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x41900000" />
+        <register type="NOA" address="0x00009888" value="0x55900000" />
+        <register type="NOA" address="0x00009888" value="0x45900021" />
+        <register type="NOA" address="0x00009888" value="0x47900000" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+        <register type="NOA" address="0x00009888" value="0x57900000" />
+        <register type="NOA" address="0x00009888" value="0x4B900000" />
+        <register type="NOA" address="0x00009888" value="0x59900000" />
+        <register type="NOA" address="0x00009888" value="0x53904444" />
+        <register type="NOA" address="0x00009888" value="0x43900000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x30800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x30800000" />
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002770" value="0x0007FFFA" />
+        <register type="OA" address="0x00002774" value="0x0000FEFE" />
+        <register type="OA" address="0x00002778" value="0x0007FFFA" />
+        <register type="OA" address="0x0000277C" value="0x0000FEFD" />
+        <register type="OA" address="0x00002790" value="0x0007FFFA" />
+        <register type="OA" address="0x00002794" value="0x0000FBEF" />
+        <register type="OA" address="0x00002798" value="0x0007FFFA" />
+        <register type="OA" address="0x0000279C" value="0x0000FBDF" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00000003" />
+        <register type="FLEX" address="0x0000E658" value="0x00002001" />
+        <register type="FLEX" address="0x0000E758" value="0x00101100" />
+        <register type="FLEX" address="0x0000E45C" value="0x00201200" />
+        <register type="FLEX" address="0x0000E55C" value="0x00301300" />
+        <register type="FLEX" address="0x0000E65C" value="0x00401400" />
+    </register_config>
+  </set>
+
+  <set name="Metric set HDCAndSF"
+       mdapi_supported_apis="VK OGL OCL IO BB"
+       underscore_name="hdc_and_sf"
+       hw_config_guid="b128f45f-bfa2-4991-aadc-05be7898e398"
+       chipset="KBLGT3"
+       symbol_name="HDCAndSF"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SQ is full"
+             description="The percentage of time when SQ is filled above a threshold (usually 48 entries)"
+             data_type="float"
+             max_equation="100"
+             equation="PERFCNT1 READ_REG 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gt_request_queue_full"
+             units="percent"
+             symbol_name="GTRequestQueueFull"
+             availability="true $QueryMode &&"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL4 OCL"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were actively processed on both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="Polygon Data Ready"
+             description="The percentage of time in which geometry pipeline output is ready"
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="poly_data_ready"
+             units="percent"
+             symbol_name="PolyDataReady"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/3D Pipe/Strip-Fans"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texel lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="HDC stalled by L3 (s0.ss1)"
+             description="Percentage of time when HDC has messages to L3, but it's stalled due to lack of credits (s0.ss1)"
+             data_type="float"
+             max_equation="100"
+             equation="C 5 READ C 4 READ USUB 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="non_sampler_shader01_access_stalled_on_l3"
+             units="percent"
+             symbol_name="NonSamplerShader01AccessStalledOnL3"
+             availability="$SubsliceMask 0x2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="GPU/Data Port"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="HDC stalled by L3 (s0.ss2)"
+             description="Percentage of time when HDC has messages to L3, but it's stalled due to lack of credits (s0.ss2)"
+             data_type="float"
+             max_equation="100"
+             equation="C 3 READ C 2 READ USUB 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="non_sampler_shader02_access_stalled_on_l3"
+             units="percent"
+             symbol_name="NonSamplerShader02AccessStalledOnL3"
+             availability="$SubsliceMask 0x4 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="GPU/Data Port"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="HDC stalled by L3 (s0.ss0)"
+             description="Percentage of time when HDC has messages to L3, but it's stalled due to lack of credits (s0.ss0)"
+             data_type="float"
+             max_equation="100"
+             equation="C 7 READ C 6 READ USUB 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="non_sampler_shader00_access_stalled_on_l3"
+             units="percent"
+             symbol_name="NonSamplerShader00AccessStalledOnL3"
+             availability="$SubsliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="GPU/Data Port"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x000091BC" value="0xE0500000" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x104F0232" />
+        <register type="NOA" address="0x00009888" value="0x124F4640" />
+        <register type="NOA" address="0x00009888" value="0x106C0232" />
+        <register type="NOA" address="0x00009888" value="0x11834400" />
+        <register type="NOA" address="0x00009888" value="0x0A4E8000" />
+        <register type="NOA" address="0x00009888" value="0x0C4E8000" />
+        <register type="NOA" address="0x00009888" value="0x004F1880" />
+        <register type="NOA" address="0x00009888" value="0x024F08BB" />
+        <register type="NOA" address="0x00009888" value="0x044F001B" />
+        <register type="NOA" address="0x00009888" value="0x046C0100" />
+        <register type="NOA" address="0x00009888" value="0x066C000B" />
+        <register type="NOA" address="0x00009888" value="0x1A6C0000" />
+        <register type="NOA" address="0x00009888" value="0x041B8000" />
+        <register type="NOA" address="0x00009888" value="0x061B4000" />
+        <register type="NOA" address="0x00009888" value="0x1A1C1800" />
+        <register type="NOA" address="0x00009888" value="0x005B8000" />
+        <register type="NOA" address="0x00009888" value="0x025BC000" />
+        <register type="NOA" address="0x00009888" value="0x045B4000" />
+        <register type="NOA" address="0x00009888" value="0x125C8000" />
+        <register type="NOA" address="0x00009888" value="0x145C8000" />
+        <register type="NOA" address="0x00009888" value="0x165C8000" />
+        <register type="NOA" address="0x00009888" value="0x185C8000" />
+        <register type="NOA" address="0x00009888" value="0x0A4C00A0" />
+        <register type="NOA" address="0x00009888" value="0x000D8000" />
+        <register type="NOA" address="0x00009888" value="0x020DA000" />
+        <register type="NOA" address="0x00009888" value="0x040DA000" />
+        <register type="NOA" address="0x00009888" value="0x060D2000" />
+        <register type="NOA" address="0x00009888" value="0x0C0F5000" />
+        <register type="NOA" address="0x00009888" value="0x0E0F0055" />
+        <register type="NOA" address="0x00009888" value="0x022CC000" />
+        <register type="NOA" address="0x00009888" value="0x042CC000" />
+        <register type="NOA" address="0x00009888" value="0x062CC000" />
+        <register type="NOA" address="0x00009888" value="0x082CC000" />
+        <register type="NOA" address="0x00009888" value="0x0A2C8000" />
+        <register type="NOA" address="0x00009888" value="0x0C2C8000" />
+        <register type="NOA" address="0x00009888" value="0x0F828000" />
+        <register type="NOA" address="0x00009888" value="0x0F8305C0" />
+        <register type="NOA" address="0x00009888" value="0x09830000" />
+        <register type="NOA" address="0x00009888" value="0x07830000" />
+        <register type="NOA" address="0x00009888" value="0x1D950080" />
+        <register type="NOA" address="0x00009888" value="0x13928000" />
+        <register type="NOA" address="0x00009888" value="0x0F988000" />
+        <register type="NOA" address="0x00009888" value="0x31904000" />
+        <register type="NOA" address="0x00009888" value="0x1190FC00" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x59900000" />
+        <register type="NOA" address="0x00009888" value="0x4B900040" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x41900800" />
+        <register type="NOA" address="0x00009888" value="0x43900842" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+        <register type="NOA" address="0x00009888" value="0x45900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002744" value="0x00800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x10800000" />
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+        <register type="OA" address="0x00002770" value="0x00000002" />
+        <register type="OA" address="0x00002774" value="0x0000FDFF" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E758" value="0x00015014" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+        <register type="FLEX" address="0x0000E65C" value="0x00055054" />
+    </register_config>
+  </set>
+
+  <set name="Metric set L3_1"
+       mdapi_supported_apis="VK OGL OCL IO BB"
+       underscore_name="l3_1"
+       hw_config_guid="f3566b55-9c13-47bf-8327-4a887af75262"
+       chipset="KBLGT3"
+       symbol_name="L3_1"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 L3 Bank1 Active"
+             description="The percentage of time in which slice0 L3 bank1 is active"
+             data_type="float"
+             max_equation="100"
+             equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l30_bank1_active"
+             units="percent"
+             symbol_name="L30Bank1Active"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SQ is full"
+             description="The percentage of time when SQ is filled above a threshold (usually 48 entries)"
+             data_type="float"
+             max_equation="100"
+             equation="PERFCNT1 READ_REG 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gt_request_queue_full"
+             units="percent"
+             symbol_name="GTRequestQueueFull"
+             availability="true $QueryMode &&"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL4 OCL"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="Slice0 L3 Bank1 Stalled"
+             description="The percentage of time in which slice0 L3 bank1 is stalled"
+             data_type="float"
+             max_equation="100"
+             equation="B 4 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l30_bank1_stalled"
+             units="percent"
+             symbol_name="L30Bank1Stalled"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texel lookups (with 2x2 accuracy) that missed the L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 L3 Bank0 Active"
+             description="The percentage of time in which slice0 L3 bank0 is active"
+             data_type="float"
+             max_equation="100"
+             equation="C 6 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l30_bank0_active"
+             units="percent"
+             symbol_name="L30Bank0Active"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 L3 Bank0 Stalled"
+             description="The percentage of time in which slice0 L3 bank0 is stalled"
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l30_bank0_stalled"
+             units="percent"
+             symbol_name="L30Bank0Stalled"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x000091BC" value="0xE0500000" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x126C7B40" />
+        <register type="NOA" address="0x00009888" value="0x166C0020" />
+        <register type="NOA" address="0x00009888" value="0x0A603444" />
+        <register type="NOA" address="0x00009888" value="0x0A613400" />
+        <register type="NOA" address="0x00009888" value="0x1A4EA800" />
+        <register type="NOA" address="0x00009888" value="0x1C4E0002" />
+        <register type="NOA" address="0x00009888" value="0x024E8000" />
+        <register type="NOA" address="0x00009888" value="0x044E8000" />
+        <register type="NOA" address="0x00009888" value="0x064E8000" />
+        <register type="NOA" address="0x00009888" value="0x084E8000" />
+        <register type="NOA" address="0x00009888" value="0x0A4E8000" />
+        <register type="NOA" address="0x00009888" value="0x064F4000" />
+        <register type="NOA" address="0x00009888" value="0x0C6C5327" />
+        <register type="NOA" address="0x00009888" value="0x0E6C5425" />
+        <register type="NOA" address="0x00009888" value="0x006C2A00" />
+        <register type="NOA" address="0x00009888" value="0x026C285B" />
+        <register type="NOA" address="0x00009888" value="0x046C005C" />
+        <register type="NOA" address="0x00009888" value="0x106C0000" />
+        <register type="NOA" address="0x00009888" value="0x1C6C0000" />
+        <register type="NOA" address="0x00009888" value="0x1E6C0000" />
+        <register type="NOA" address="0x00009888" value="0x1A6C0800" />
+        <register type="NOA" address="0x00009888" value="0x0C1BC000" />
+        <register type="NOA" address="0x00009888" value="0x0E1BC000" />
+        <register type="NOA" address="0x00009888" value="0x001B8000" />
+        <register type="NOA" address="0x00009888" value="0x021BC000" />
+        <register type="NOA" address="0x00009888" value="0x041BC000" />
+        <register type="NOA" address="0x00009888" value="0x1C1C003C" />
+        <register type="NOA" address="0x00009888" value="0x121C8000" />
+        <register type="NOA" address="0x00009888" value="0x141C8000" />
+        <register type="NOA" address="0x00009888" value="0x161C8000" />
+        <register type="NOA" address="0x00009888" value="0x181C8000" />
+        <register type="NOA" address="0x00009888" value="0x1A1C0800" />
+        <register type="NOA" address="0x00009888" value="0x065B4000" />
+        <register type="NOA" address="0x00009888" value="0x1A5C1000" />
+        <register type="NOA" address="0x00009888" value="0x10600000" />
+        <register type="NOA" address="0x00009888" value="0x04600000" />
+        <register type="NOA" address="0x00009888" value="0x0C610044" />
+        <register type="NOA" address="0x00009888" value="0x10610000" />
+        <register type="NOA" address="0x00009888" value="0x06610000" />
+        <register type="NOA" address="0x00009888" value="0x0C4C02A8" />
+        <register type="NOA" address="0x00009888" value="0x084CA000" />
+        <register type="NOA" address="0x00009888" value="0x0A4C002A" />
+        <register type="NOA" address="0x00009888" value="0x0C0DA000" />
+        <register type="NOA" address="0x00009888" value="0x0E0DA000" />
+        <register type="NOA" address="0x00009888" value="0x000D8000" />
+        <register type="NOA" address="0x00009888" value="0x020DA000" />
+        <register type="NOA" address="0x00009888" value="0x040DA000" />
+        <register type="NOA" address="0x00009888" value="0x060D2000" />
+        <register type="NOA" address="0x00009888" value="0x100F0154" />
+        <register type="NOA" address="0x00009888" value="0x0C0F5000" />
+        <register type="NOA" address="0x00009888" value="0x0E0F0055" />
+        <register type="NOA" address="0x00009888" value="0x182C00AA" />
+        <register type="NOA" address="0x00009888" value="0x022C8000" />
+        <register type="NOA" address="0x00009888" value="0x042C8000" />
+        <register type="NOA" address="0x00009888" value="0x062C8000" />
+        <register type="NOA" address="0x00009888" value="0x082C8000" />
+        <register type="NOA" address="0x00009888" value="0x0A2C8000" />
+        <register type="NOA" address="0x00009888" value="0x0C2CC000" />
+        <register type="NOA" address="0x00009888" value="0x1190FFC0" />
+        <register type="NOA" address="0x00009888" value="0x57900000" />
+        <register type="NOA" address="0x00009888" value="0x49900420" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+        <register type="NOA" address="0x00009888" value="0x4B900021" />
+        <register type="NOA" address="0x00009888" value="0x59900000" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x41900400" />
+        <register type="NOA" address="0x00009888" value="0x43900421" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+        <register type="NOA" address="0x00009888" value="0x45900040" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002744" value="0x00800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0xF0800000" />
+        <register type="OA" address="0x00002770" value="0x00100070" />
+        <register type="OA" address="0x00002774" value="0x0000FFF1" />
+        <register type="OA" address="0x00002778" value="0x00014002" />
+        <register type="OA" address="0x0000277C" value="0x0000C3FF" />
+        <register type="OA" address="0x00002780" value="0x00010002" />
+        <register type="OA" address="0x00002784" value="0x0000C7FF" />
+        <register type="OA" address="0x00002788" value="0x00004002" />
+        <register type="OA" address="0x0000278C" value="0x0000D3FF" />
+        <register type="OA" address="0x00002790" value="0x00100700" />
+        <register type="OA" address="0x00002794" value="0x0000FF1F" />
+        <register type="OA" address="0x00002798" value="0x00001402" />
+        <register type="OA" address="0x0000279C" value="0x0000FC3F" />
+        <register type="OA" address="0x000027A0" value="0x00001002" />
+        <register type="OA" address="0x000027A4" value="0x0000FC7F" />
+        <register type="OA" address="0x000027A8" value="0x00000402" />
+        <register type="OA" address="0x000027AC" value="0x0000FD3F" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E758" value="0x00015014" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+        <register type="FLEX" address="0x0000E65C" value="0x00055054" />
+    </register_config>
+  </set>
+
+  <set name="Metric set L3_2"
+       mdapi_supported_apis="VK OGL OCL IO BB"
+       underscore_name="l3_2"
+       hw_config_guid="7b21aa68-9076-4ab4-8a84-e45a06c8eac6"
+       chipset="KBLGT3"
+       symbol_name="L3_2"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SQ is full"
+             description="The percentage of time when SQ is filled above a threshold (usually 48 entries)"
+             data_type="float"
+             max_equation="100"
+             equation="PERFCNT1 READ_REG 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gt_request_queue_full"
+             units="percent"
+             symbol_name="GTRequestQueueFull"
+             availability="true $QueryMode &&"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL4 OCL"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on the both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 L3 Bank2 Stalled"
+             description="The percentage of time in which slice0 L3 bank2 is stalled"
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l30_bank2_stalled"
+             units="percent"
+             symbol_name="L30Bank2Stalled"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 L3 Bank2 Active"
+             description="The percentage of time in which slice0 L3 bank2 is active"
+             data_type="float"
+             max_equation="100"
+             equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l30_bank2_active"
+             units="percent"
+             symbol_name="L30Bank2Active"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x000091BC" value="0xE0500000" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x126C02E0" />
+        <register type="NOA" address="0x00009888" value="0x146C0001" />
+        <register type="NOA" address="0x00009888" value="0x0A623400" />
+        <register type="NOA" address="0x00009888" value="0x044E8000" />
+        <register type="NOA" address="0x00009888" value="0x064E8000" />
+        <register type="NOA" address="0x00009888" value="0x084E8000" />
+        <register type="NOA" address="0x00009888" value="0x0A4E8000" />
+        <register type="NOA" address="0x00009888" value="0x064F4000" />
+        <register type="NOA" address="0x00009888" value="0x026C3324" />
+        <register type="NOA" address="0x00009888" value="0x046C3422" />
+        <register type="NOA" address="0x00009888" value="0x106C0000" />
+        <register type="NOA" address="0x00009888" value="0x1A6C0000" />
+        <register type="NOA" address="0x00009888" value="0x021BC000" />
+        <register type="NOA" address="0x00009888" value="0x041BC000" />
+        <register type="NOA" address="0x00009888" value="0x141C8000" />
+        <register type="NOA" address="0x00009888" value="0x161C8000" />
+        <register type="NOA" address="0x00009888" value="0x181C8000" />
+        <register type="NOA" address="0x00009888" value="0x1A1C0800" />
+        <register type="NOA" address="0x00009888" value="0x065B4000" />
+        <register type="NOA" address="0x00009888" value="0x1A5C1000" />
+        <register type="NOA" address="0x00009888" value="0x06614000" />
+        <register type="NOA" address="0x00009888" value="0x0C620044" />
+        <register type="NOA" address="0x00009888" value="0x10620000" />
+        <register type="NOA" address="0x00009888" value="0x06620000" />
+        <register type="NOA" address="0x00009888" value="0x084C8000" />
+        <register type="NOA" address="0x00009888" value="0x0A4C002A" />
+        <register type="NOA" address="0x00009888" value="0x020DA000" />
+        <register type="NOA" address="0x00009888" value="0x040DA000" />
+        <register type="NOA" address="0x00009888" value="0x060D2000" />
+        <register type="NOA" address="0x00009888" value="0x0C0F4000" />
+        <register type="NOA" address="0x00009888" value="0x0E0F0055" />
+        <register type="NOA" address="0x00009888" value="0x042C8000" />
+        <register type="NOA" address="0x00009888" value="0x062C8000" />
+        <register type="NOA" address="0x00009888" value="0x082C8000" />
+        <register type="NOA" address="0x00009888" value="0x0A2C8000" />
+        <register type="NOA" address="0x00009888" value="0x0C2CC000" />
+        <register type="NOA" address="0x00009888" value="0x1190F800" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x43900000" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+        <register type="NOA" address="0x00009888" value="0x45900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002744" value="0x00800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+        <register type="OA" address="0x00002770" value="0x00100070" />
+        <register type="OA" address="0x00002774" value="0x0000FFF1" />
+        <register type="OA" address="0x00002778" value="0x00028002" />
+        <register type="OA" address="0x0000277C" value="0x000087FF" />
+        <register type="OA" address="0x00002780" value="0x00020002" />
+        <register type="OA" address="0x00002784" value="0x00008FFF" />
+        <register type="OA" address="0x00002788" value="0x00008002" />
+        <register type="OA" address="0x0000278C" value="0x0000A7FF" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E758" value="0x00015014" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+        <register type="FLEX" address="0x0000E65C" value="0x00055054" />
+    </register_config>
+  </set>
+
+  <set name="Metric set L3_3"
+       mdapi_supported_apis="VK OGL OCL IO BB"
+       underscore_name="l3_3"
+       hw_config_guid="71b4b9dd-ae28-48ce-9a1a-5431e1f23afd"
+       chipset="KBLGT3"
+       symbol_name="L3_3"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SQ is full"
+             description="The percentage of time when SQ is filled above a threshold (usually 48 entries)"
+             data_type="float"
+             max_equation="100"
+             equation="PERFCNT1 READ_REG 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gt_request_queue_full"
+             units="percent"
+             symbol_name="GTRequestQueueFull"
+             availability="true $QueryMode &amp;&amp;"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL4 OCL"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on the both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Slice0 L3 Bank3 Stalled"
+             description="The percentage of time in which slice0 L3 bank3 is stalled"
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l30_bank3_stalled"
+             units="percent"
+             symbol_name="L30Bank3Stalled"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 L3 Bank3 Active"
+             description="The percentage of time in which slice0 L3 bank3 is active"
+             data_type="float"
+             max_equation="100"
+             equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l30_bank3_active"
+             units="percent"
+             symbol_name="L30Bank3Active"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x000091BC" value="0xE0500000" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x126C4E80" />
+        <register type="NOA" address="0x00009888" value="0x146C0000" />
+        <register type="NOA" address="0x00009888" value="0x0A633400" />
+        <register type="NOA" address="0x00009888" value="0x044E8000" />
+        <register type="NOA" address="0x00009888" value="0x064E8000" />
+        <register type="NOA" address="0x00009888" value="0x084E8000" />
+        <register type="NOA" address="0x00009888" value="0x0A4E8000" />
+        <register type="NOA" address="0x00009888" value="0x0C4E8000" />
+        <register type="NOA" address="0x00009888" value="0x026C3321" />
+        <register type="NOA" address="0x00009888" value="0x046C342F" />
+        <register type="NOA" address="0x00009888" value="0x106C0000" />
+        <register type="NOA" address="0x00009888" value="0x1A6C2000" />
+        <register type="NOA" address="0x00009888" value="0x021BC000" />
+        <register type="NOA" address="0x00009888" value="0x041BC000" />
+        <register type="NOA" address="0x00009888" value="0x061B4000" />
+        <register type="NOA" address="0x00009888" value="0x141C8000" />
+        <register type="NOA" address="0x00009888" value="0x161C8000" />
+        <register type="NOA" address="0x00009888" value="0x181C8000" />
+        <register type="NOA" address="0x00009888" value="0x1A1C1800" />
+        <register type="NOA" address="0x00009888" value="0x06604000" />
+        <register type="NOA" address="0x00009888" value="0x0C630044" />
+        <register type="NOA" address="0x00009888" value="0x10630000" />
+        <register type="NOA" address="0x00009888" value="0x06630000" />
+        <register type="NOA" address="0x00009888" value="0x084C8000" />
+        <register type="NOA" address="0x00009888" value="0x0A4C00AA" />
+        <register type="NOA" address="0x00009888" value="0x020DA000" />
+        <register type="NOA" address="0x00009888" value="0x040DA000" />
+        <register type="NOA" address="0x00009888" value="0x060D2000" />
+        <register type="NOA" address="0x00009888" value="0x0C0F4000" />
+        <register type="NOA" address="0x00009888" value="0x0E0F0055" />
+        <register type="NOA" address="0x00009888" value="0x042C8000" />
+        <register type="NOA" address="0x00009888" value="0x062C8000" />
+        <register type="NOA" address="0x00009888" value="0x082C8000" />
+        <register type="NOA" address="0x00009888" value="0x0A2C8000" />
+        <register type="NOA" address="0x00009888" value="0x0C2C8000" />
+        <register type="NOA" address="0x00009888" value="0x1190F800" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x43900842" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+        <register type="NOA" address="0x00009888" value="0x45900002" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002744" value="0x00800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+        <register type="OA" address="0x00002770" value="0x00100070" />
+        <register type="OA" address="0x00002774" value="0x0000FFF1" />
+        <register type="OA" address="0x00002778" value="0x00028002" />
+        <register type="OA" address="0x0000277C" value="0x000087FF" />
+        <register type="OA" address="0x00002780" value="0x00020002" />
+        <register type="OA" address="0x00002784" value="0x00008FFF" />
+        <register type="OA" address="0x00002788" value="0x00008002" />
+        <register type="OA" address="0x0000278C" value="0x0000A7FF" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E758" value="0x00015014" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+        <register type="FLEX" address="0x0000E65C" value="0x00055054" />
+    </register_config>
+  </set>
+
+  <set name="Metric set RasterizerAndPixelBackend"
+       mdapi_supported_apis="VK OGL OCL IO BB"
+       underscore_name="rasterizer_and_pixel_backend"
+       hw_config_guid="52c646ca-52da-4853-877e-8645e73ed330"
+       chipset="KBLGT3"
+       symbol_name="RasterizerAndPixelBackend"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SQ is full"
+             description="The percentage of time when SQ is filled above a threshold (usually 48 entries)"
+             data_type="float"
+             max_equation="100"
+             equation="PERFCNT1 READ_REG 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gt_request_queue_full"
+             units="percent"
+             symbol_name="GTRequestQueueFull"
+             availability="true $QueryMode &&"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL4 OCL"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on the both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Slice0 Pixel Values Ready"
+             description="The percentage of time in which slice0 pixel values are ready"
+             data_type="float"
+             max_equation="100"
+             equation="C 6 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="pixel_values0_ready"
+             units="percent"
+             symbol_name="PixelValues0Ready"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/3D Pipe"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="Slice0 Rasterizer Input Available"
+             description="The percentage of time in which slice0 rasterizer input is available"
+             data_type="float"
+             max_equation="100"
+             equation="B 1 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="rasterizer0_input_available"
+             units="percent"
+             symbol_name="Rasterizer0InputAvailable"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Rasterizer"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Slice0 Post-EarlyZ Pixel Data Ready"
+             description="The percentage of time in which slice0 post-EarlyZ pixel data is ready (after early Z tests have been applied)"
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="pixel_data0_ready"
+             units="percent"
+             symbol_name="PixelData0Ready"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Rasterizer/Early Depth Test"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 Rasterizer Output Ready"
+             description="The percentage of time in which slice0 rasterizer output is ready"
+             data_type="float"
+             max_equation="100"
+             equation="C 5 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="rasterizer0_output_ready"
+             units="percent"
+             symbol_name="Rasterizer0OutputReady"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Rasterizer"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="Slice0 PS Output Available"
+             description="The percentage of time in which slice0 PS output is available"
+             data_type="float"
+             max_equation="100"
+             equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_output0_available"
+             units="percent"
+             symbol_name="PSOutput0Available"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/3D Pipe"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x000091BC" value="0xE0500000" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x102F3800" />
+        <register type="NOA" address="0x00009888" value="0x144D0500" />
+        <register type="NOA" address="0x00009888" value="0x120D03C0" />
+        <register type="NOA" address="0x00009888" value="0x140D03CF" />
+        <register type="NOA" address="0x00009888" value="0x0C0F0004" />
+        <register type="NOA" address="0x00009888" value="0x0C4E4000" />
+        <register type="NOA" address="0x00009888" value="0x042F0480" />
+        <register type="NOA" address="0x00009888" value="0x082F0000" />
+        <register type="NOA" address="0x00009888" value="0x022F0000" />
+        <register type="NOA" address="0x00009888" value="0x0A4C0090" />
+        <register type="NOA" address="0x00009888" value="0x064D0027" />
+        <register type="NOA" address="0x00009888" value="0x004D0000" />
+        <register type="NOA" address="0x00009888" value="0x000D0D40" />
+        <register type="NOA" address="0x00009888" value="0x020D803F" />
+        <register type="NOA" address="0x00009888" value="0x040D8023" />
+        <register type="NOA" address="0x00009888" value="0x100D0000" />
+        <register type="NOA" address="0x00009888" value="0x060D2000" />
+        <register type="NOA" address="0x00009888" value="0x020F0010" />
+        <register type="NOA" address="0x00009888" value="0x000F0000" />
+        <register type="NOA" address="0x00009888" value="0x0E0F0050" />
+        <register type="NOA" address="0x00009888" value="0x0A2C8000" />
+        <register type="NOA" address="0x00009888" value="0x0C2C8000" />
+        <register type="NOA" address="0x00009888" value="0x1190FC00" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x41901400" />
+        <register type="NOA" address="0x00009888" value="0x43901485" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+        <register type="NOA" address="0x00009888" value="0x45900001" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002744" value="0x00800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x30800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+        <register type="OA" address="0x00002770" value="0x00000002" />
+        <register type="OA" address="0x00002774" value="0x0000EFFF" />
+        <register type="OA" address="0x00002778" value="0x00006000" />
+        <register type="OA" address="0x0000277C" value="0x0000F3FF" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E758" value="0x00015014" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+        <register type="FLEX" address="0x0000E65C" value="0x00055054" />
+    </register_config>
+  </set>
+
+  <set name="Metric set Sampler"
+       mdapi_supported_apis="VK OGL OCL IO BB"
+       underscore_name="sampler"
+       hw_config_guid="c4bb682f-677c-4875-990b-005230be87b4"
+       chipset="KBLGT3"
+       symbol_name="Sampler"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 Subslice2 Input Available"
+             description="The percentage of time in which slice0 subslice2 sampler input is available"
+             data_type="float"
+             max_equation="100"
+             equation="B 1 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler02_input_available"
+             units="percent"
+             symbol_name="Sampler02InputAvailable"
+             availability="$SubsliceMask 0x4 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SQ is full"
+             description="The percentage of time when SQ is filled above a threshold (usually 48 entries)"
+             data_type="float"
+             max_equation="100"
+             equation="PERFCNT1 READ_REG 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gt_request_queue_full"
+             units="percent"
+             symbol_name="GTRequestQueueFull"
+             availability="true $QueryMode &&"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL4 OCL"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 Subslice0 Input Available"
+             description="The percentage of time in which slice0 subslice0 sampler input is available"
+             data_type="float"
+             max_equation="100"
+             equation="B 2 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler00_input_available"
+             units="percent"
+             symbol_name="Sampler00InputAvailable"
+             availability="$SubsliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on the both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="Slice0 Subslice2 Sampler Output Ready"
+             description="The percentage of time in which slice0 subslice2 sampler output is ready"
+             data_type="float"
+             max_equation="100"
+             equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler02_output_ready"
+             units="percent"
+             symbol_name="Sampler02OutputReady"
+             availability="$SubsliceMask 0x4 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Slice0 Subslice1 Input Available"
+             description="The percentage of time in which slice0 subslice1 sampler input is available"
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler01_input_available"
+             units="percent"
+             symbol_name="Sampler01InputAvailable"
+             availability="$SubsliceMask 0x2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Slice0 Subslice0 Sampler Output Ready"
+             description="The percentage of time in which slice0 subslice0 sampler output is ready"
+             data_type="float"
+             max_equation="100"
+             equation="C 6 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler00_output_ready"
+             units="percent"
+             symbol_name="Sampler00OutputReady"
+             availability="$SubsliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Slice0 Subslice1 Sampler Output Ready"
+             description="The percentage of time in which slice0 subslice1 sampler output is ready"
+             data_type="float"
+             max_equation="100"
+             equation="C 5 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler01_output_ready"
+             units="percent"
+             symbol_name="Sampler01OutputReady"
+             availability="$SubsliceMask 0x2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x000091BC" value="0xE0500000" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x14152C00" />
+        <register type="NOA" address="0x00009888" value="0x16150005" />
+        <register type="NOA" address="0x00009888" value="0x121600A0" />
+        <register type="NOA" address="0x00009888" value="0x14352C00" />
+        <register type="NOA" address="0x00009888" value="0x16350005" />
+        <register type="NOA" address="0x00009888" value="0x123600A0" />
+        <register type="NOA" address="0x00009888" value="0x14552C00" />
+        <register type="NOA" address="0x00009888" value="0x16550005" />
+        <register type="NOA" address="0x00009888" value="0x125600A0" />
+        <register type="NOA" address="0x00009888" value="0x062F6000" />
+        <register type="NOA" address="0x00009888" value="0x022F2000" />
+        <register type="NOA" address="0x00009888" value="0x0C4C0050" />
+        <register type="NOA" address="0x00009888" value="0x0A4C0010" />
+        <register type="NOA" address="0x00009888" value="0x0C0D8000" />
+        <register type="NOA" address="0x00009888" value="0x0E0DA000" />
+        <register type="NOA" address="0x00009888" value="0x000D8000" />
+        <register type="NOA" address="0x00009888" value="0x020DA000" />
+        <register type="NOA" address="0x00009888" value="0x040DA000" />
+        <register type="NOA" address="0x00009888" value="0x060D2000" />
+        <register type="NOA" address="0x00009888" value="0x100F0350" />
+        <register type="NOA" address="0x00009888" value="0x0C0FB000" />
+        <register type="NOA" address="0x00009888" value="0x0E0F00DA" />
+        <register type="NOA" address="0x00009888" value="0x182C0028" />
+        <register type="NOA" address="0x00009888" value="0x0A2C8000" />
+        <register type="NOA" address="0x00009888" value="0x022DC000" />
+        <register type="NOA" address="0x00009888" value="0x042D4000" />
+        <register type="NOA" address="0x00009888" value="0x0C138000" />
+        <register type="NOA" address="0x00009888" value="0x0E132000" />
+        <register type="NOA" address="0x00009888" value="0x0413C000" />
+        <register type="NOA" address="0x00009888" value="0x1C140018" />
+        <register type="NOA" address="0x00009888" value="0x0C157000" />
+        <register type="NOA" address="0x00009888" value="0x0E150078" />
+        <register type="NOA" address="0x00009888" value="0x10150000" />
+        <register type="NOA" address="0x00009888" value="0x04162180" />
+        <register type="NOA" address="0x00009888" value="0x02160000" />
+        <register type="NOA" address="0x00009888" value="0x04174000" />
+        <register type="NOA" address="0x00009888" value="0x0233A000" />
+        <register type="NOA" address="0x00009888" value="0x04333000" />
+        <register type="NOA" address="0x00009888" value="0x14348000" />
+        <register type="NOA" address="0x00009888" value="0x16348000" />
+        <register type="NOA" address="0x00009888" value="0x02357870" />
+        <register type="NOA" address="0x00009888" value="0x10350000" />
+        <register type="NOA" address="0x00009888" value="0x04360043" />
+        <register type="NOA" address="0x00009888" value="0x02360000" />
+        <register type="NOA" address="0x00009888" value="0x04371000" />
+        <register type="NOA" address="0x00009888" value="0x0E538000" />
+        <register type="NOA" address="0x00009888" value="0x00538000" />
+        <register type="NOA" address="0x00009888" value="0x06533000" />
+        <register type="NOA" address="0x00009888" value="0x1C540020" />
+        <register type="NOA" address="0x00009888" value="0x12548000" />
+        <register type="NOA" address="0x00009888" value="0x0E557000" />
+        <register type="NOA" address="0x00009888" value="0x00557800" />
+        <register type="NOA" address="0x00009888" value="0x10550000" />
+        <register type="NOA" address="0x00009888" value="0x06560043" />
+        <register type="NOA" address="0x00009888" value="0x02560000" />
+        <register type="NOA" address="0x00009888" value="0x06571000" />
+        <register type="NOA" address="0x00009888" value="0x1190FF80" />
+        <register type="NOA" address="0x00009888" value="0x57900000" />
+        <register type="NOA" address="0x00009888" value="0x49900000" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+        <register type="NOA" address="0x00009888" value="0x4B900060" />
+        <register type="NOA" address="0x00009888" value="0x59900000" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x41900C00" />
+        <register type="NOA" address="0x00009888" value="0x43900842" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+        <register type="NOA" address="0x00009888" value="0x45900060" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002744" value="0x00800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x70800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+        <register type="OA" address="0x00002770" value="0x0000C000" />
+        <register type="OA" address="0x00002774" value="0x0000E7FF" />
+        <register type="OA" address="0x00002778" value="0x00003000" />
+        <register type="OA" address="0x0000277C" value="0x0000F9FF" />
+        <register type="OA" address="0x00002780" value="0x00000C00" />
+        <register type="OA" address="0x00002784" value="0x0000FE7F" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E758" value="0x00015014" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+        <register type="FLEX" address="0x0000E65C" value="0x00055054" />
+    </register_config>
+  </set>
+
+  <set name="Metric set TDL_1"
+       mdapi_supported_apis="VK OGL OCL IO BB"
+       underscore_name="tdl_1"
+       hw_config_guid="ade8521b-5e72-45d4-8c25-d9f0da774899"
+       chipset="KBLGT3"
+       symbol_name="TDL_1"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SQ is full"
+             description="The percentage of time when SQ is filled above a threshold (usually 48 entries)"
+             data_type="float"
+             max_equation="100"
+             equation="PERFCNT1 READ_REG 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gt_request_queue_full"
+             units="percent"
+             symbol_name="GTRequestQueueFull"
+             availability="true $QueryMode &amp;&amp;"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL4 OCL"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on the both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="NonPS Thread Ready For Dispatch on Slice0 Subslice2"
+             description="The percentage of time in which non-PS thread is ready for dispatch on slice0 subslice2 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="B 4 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="non_ps_thread02_ready_for_dispatch"
+             units="percent"
+             symbol_name="NonPSThread02ReadyForDispatch"
+             availability="$SubsliceMask 0x4 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="NonPS Thread Ready For Dispatch on Slice0 Subslice0"
+             description="The percentage of time in which non-PS thread is ready for dispatch on slice0 subslice0 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="B 2 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="non_ps_thread00_ready_for_dispatch"
+             units="percent"
+             symbol_name="NonPSThread00ReadyForDispatch"
+             availability="$SubsliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Thread Ready For Dispatch on Slice0 Subslice0"
+             description="The percentage of time in which PS thread is ready for dispatch on slice0 subslice0 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="B 1 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_thread00_ready_for_dispatch"
+             units="percent"
+             symbol_name="PSThread00ReadyForDispatch"
+             availability="$SubsliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="PS Thread Ready For Dispatch on Slice0 Subslice1"
+             description="The percentage of time in which PS thread is ready for dispatch on slice0 subslice1 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="B 5 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_thread01_ready_for_dispatch"
+             units="percent"
+             symbol_name="PSThread01ReadyForDispatch"
+             availability="$SubsliceMask 0x2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="PS Thread Ready For Dispatch on Slice0 Subslice2"
+             description="The percentage of time in which PS thread is ready for dispatch on slice0 subslice2 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="B 3 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_thread02_ready_for_dispatch"
+             units="percent"
+             symbol_name="PSThread02ReadyForDispatch"
+             availability="$SubsliceMask 0x4 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <counter name="NonPS Thread Ready For Dispatch on Slice0 Subslice1"
+             description="The percentage of time in which non-PS thread is ready for dispatch on slice0 subslice1 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="non_ps_thread01_ready_for_dispatch"
+             units="percent"
+             symbol_name="NonPSThread01ReadyForDispatch"
+             availability="$SubsliceMask 0x2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x000091BC" value="0xE0500000" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x12120000" />
+        <register type="NOA" address="0x00009888" value="0x12320000" />
+        <register type="NOA" address="0x00009888" value="0x12520000" />
+        <register type="NOA" address="0x00009888" value="0x002F8000" />
+        <register type="NOA" address="0x00009888" value="0x022F3000" />
+        <register type="NOA" address="0x00009888" value="0x0A4C0015" />
+        <register type="NOA" address="0x00009888" value="0x0C0D8000" />
+        <register type="NOA" address="0x00009888" value="0x0E0DA000" />
+        <register type="NOA" address="0x00009888" value="0x000D8000" />
+        <register type="NOA" address="0x00009888" value="0x020DA000" />
+        <register type="NOA" address="0x00009888" value="0x040DA000" />
+        <register type="NOA" address="0x00009888" value="0x060D2000" />
+        <register type="NOA" address="0x00009888" value="0x100F03A0" />
+        <register type="NOA" address="0x00009888" value="0x0C0FF000" />
+        <register type="NOA" address="0x00009888" value="0x0E0F0095" />
+        <register type="NOA" address="0x00009888" value="0x062C8000" />
+        <register type="NOA" address="0x00009888" value="0x082C8000" />
+        <register type="NOA" address="0x00009888" value="0x0A2C8000" />
+        <register type="NOA" address="0x00009888" value="0x0C2D8000" />
+        <register type="NOA" address="0x00009888" value="0x0E2D4000" />
+        <register type="NOA" address="0x00009888" value="0x062D4000" />
+        <register type="NOA" address="0x00009888" value="0x02108000" />
+        <register type="NOA" address="0x00009888" value="0x0410C000" />
+        <register type="NOA" address="0x00009888" value="0x02118000" />
+        <register type="NOA" address="0x00009888" value="0x0411C000" />
+        <register type="NOA" address="0x00009888" value="0x02121880" />
+        <register type="NOA" address="0x00009888" value="0x041219B5" />
+        <register type="NOA" address="0x00009888" value="0x00120000" />
+        <register type="NOA" address="0x00009888" value="0x02134000" />
+        <register type="NOA" address="0x00009888" value="0x04135000" />
+        <register type="NOA" address="0x00009888" value="0x0C308000" />
+        <register type="NOA" address="0x00009888" value="0x0E304000" />
+        <register type="NOA" address="0x00009888" value="0x06304000" />
+        <register type="NOA" address="0x00009888" value="0x0C318000" />
+        <register type="NOA" address="0x00009888" value="0x0E314000" />
+        <register type="NOA" address="0x00009888" value="0x06314000" />
+        <register type="NOA" address="0x00009888" value="0x0C321A80" />
+        <register type="NOA" address="0x00009888" value="0x0E320033" />
+        <register type="NOA" address="0x00009888" value="0x06320031" />
+        <register type="NOA" address="0x00009888" value="0x00320000" />
+        <register type="NOA" address="0x00009888" value="0x0C334000" />
+        <register type="NOA" address="0x00009888" value="0x0E331000" />
+        <register type="NOA" address="0x00009888" value="0x06331000" />
+        <register type="NOA" address="0x00009888" value="0x0E508000" />
+        <register type="NOA" address="0x00009888" value="0x00508000" />
+        <register type="NOA" address="0x00009888" value="0x02504000" />
+        <register type="NOA" address="0x00009888" value="0x0E518000" />
+        <register type="NOA" address="0x00009888" value="0x00518000" />
+        <register type="NOA" address="0x00009888" value="0x02514000" />
+        <register type="NOA" address="0x00009888" value="0x0E521880" />
+        <register type="NOA" address="0x00009888" value="0x00521A80" />
+        <register type="NOA" address="0x00009888" value="0x02520033" />
+        <register type="NOA" address="0x00009888" value="0x0E534000" />
+        <register type="NOA" address="0x00009888" value="0x00534000" />
+        <register type="NOA" address="0x00009888" value="0x02531000" />
+        <register type="NOA" address="0x00009888" value="0x1190FF80" />
+        <register type="NOA" address="0x00009888" value="0x57900000" />
+        <register type="NOA" address="0x00009888" value="0x49900800" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+        <register type="NOA" address="0x00009888" value="0x4B900062" />
+        <register type="NOA" address="0x00009888" value="0x59900000" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x41900C00" />
+        <register type="NOA" address="0x00009888" value="0x43900003" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+        <register type="NOA" address="0x00009888" value="0x45900040" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002744" value="0x00800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x30800000" />
+        <register type="OA" address="0x00002770" value="0x00000002" />
+        <register type="OA" address="0x00002774" value="0x00007FFF" />
+        <register type="OA" address="0x00002778" value="0x00000000" />
+        <register type="OA" address="0x0000277C" value="0x00009FFF" />
+        <register type="OA" address="0x00002780" value="0x00000002" />
+        <register type="OA" address="0x00002784" value="0x0000EFFF" />
+        <register type="OA" address="0x00002788" value="0x00000000" />
+        <register type="OA" address="0x0000278C" value="0x0000F3FF" />
+        <register type="OA" address="0x00002790" value="0x00000002" />
+        <register type="OA" address="0x00002794" value="0x0000FDFF" />
+        <register type="OA" address="0x00002798" value="0x00000000" />
+        <register type="OA" address="0x0000279C" value="0x0000FE7F" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E758" value="0x00015014" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+        <register type="FLEX" address="0x0000E65C" value="0x00055054" />
+    </register_config>
+  </set>
+
+  <set name="Metric set TDL_2"
+       mdapi_supported_apis="VK OGL OCL IO BB"
+       underscore_name="tdl_2"
+       hw_config_guid="9df2815d-4e9e-417f-bde1-3788dc6e1ea1"
+       chipset="KBLGT3"
+       symbol_name="TDL_2"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SQ is full"
+             description="The percentage of time when SQ is filled above a threshold (usually 48 entries)"
+             data_type="float"
+             max_equation="100"
+             equation="PERFCNT1 READ_REG 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gt_request_queue_full"
+             units="percent"
+             symbol_name="GTRequestQueueFull"
+             availability="true $QueryMode &&"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL4 OCL"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on the both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Thread Header Ready on Slice0 Subslice1 Port 0"
+             description="The percentage of time in which thread header is ready on slice0 subslice1 thread dispatcher port 0"
+             data_type="float"
+             max_equation="100"
+             equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header01_ready_port0"
+             units="percent"
+             symbol_name="ThreadHeader01ReadyPort0"
+             availability="$SubsliceMask 0x2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Thread Header Ready on Slice0 Subslice1 Port 1"
+             description="The percentage of time in which thread header is ready on slice0 subslice1 thread dispatcher port 1"
+             data_type="float"
+             max_equation="100"
+             equation="C 2 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header01_ready_port1"
+             units="percent"
+             symbol_name="ThreadHeader01ReadyPort1"
+             availability="$SubsliceMask 0x2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Thread Header Ready on Slice0 Subslice2 Port 1"
+             description="The percentage of time in which thread header is ready on slice0 subslice2 thread dispatcher port 1"
+             data_type="float"
+             max_equation="100"
+             equation="C 4 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header02_ready_port1"
+             units="percent"
+             symbol_name="ThreadHeader02ReadyPort1"
+             availability="$SubsliceMask 0x4 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Thread Header Ready on Slice0 Subslice2 Port 0"
+             description="The percentage of time in which thread header is ready on slice0 subslice2 thread dispatcher port 0"
+             data_type="float"
+             max_equation="100"
+             equation="C 3 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header02_ready_port0"
+             units="percent"
+             symbol_name="ThreadHeader02ReadyPort0"
+             availability="$SubsliceMask 0x4 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="Thread Header Ready on Slice0 Subslice0 Port 0"
+             description="The percentage of time in which thread header is ready on slice0 subslice0 thread dispatcher port 0"
+             data_type="float"
+             max_equation="100"
+             equation="C 5 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header00_ready_port0"
+             units="percent"
+             symbol_name="ThreadHeader00ReadyPort0"
+             availability="$SubsliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <counter name="Thread Header Ready on Slice0 Subslice0 Port 1"
+             description="The percentage of time in which thread header is ready on slice0 subslice0 thread dispatcher port 1"
+             data_type="float"
+             max_equation="100"
+             equation="C 6 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header00_ready_port1"
+             units="percent"
+             symbol_name="ThreadHeader00ReadyPort1"
+             availability="$SubsliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x000091BC" value="0xE0500000" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x12124D60" />
+        <register type="NOA" address="0x00009888" value="0x12322E60" />
+        <register type="NOA" address="0x00009888" value="0x12524D60" />
+        <register type="NOA" address="0x00009888" value="0x022F3000" />
+        <register type="NOA" address="0x00009888" value="0x0A4C0014" />
+        <register type="NOA" address="0x00009888" value="0x000D8000" />
+        <register type="NOA" address="0x00009888" value="0x020DA000" />
+        <register type="NOA" address="0x00009888" value="0x040DA000" />
+        <register type="NOA" address="0x00009888" value="0x060D2000" />
+        <register type="NOA" address="0x00009888" value="0x0C0FE000" />
+        <register type="NOA" address="0x00009888" value="0x0E0F0097" />
+        <register type="NOA" address="0x00009888" value="0x082C8000" />
+        <register type="NOA" address="0x00009888" value="0x0A2C8000" />
+        <register type="NOA" address="0x00009888" value="0x002D8000" />
+        <register type="NOA" address="0x00009888" value="0x062D4000" />
+        <register type="NOA" address="0x00009888" value="0x0410C000" />
+        <register type="NOA" address="0x00009888" value="0x0411C000" />
+        <register type="NOA" address="0x00009888" value="0x04121FB7" />
+        <register type="NOA" address="0x00009888" value="0x00120000" />
+        <register type="NOA" address="0x00009888" value="0x04135000" />
+        <register type="NOA" address="0x00009888" value="0x00308000" />
+        <register type="NOA" address="0x00009888" value="0x06304000" />
+        <register type="NOA" address="0x00009888" value="0x00318000" />
+        <register type="NOA" address="0x00009888" value="0x06314000" />
+        <register type="NOA" address="0x00009888" value="0x00321B80" />
+        <register type="NOA" address="0x00009888" value="0x0632003F" />
+        <register type="NOA" address="0x00009888" value="0x00334000" />
+        <register type="NOA" address="0x00009888" value="0x06331000" />
+        <register type="NOA" address="0x00009888" value="0x0250C000" />
+        <register type="NOA" address="0x00009888" value="0x0251C000" />
+        <register type="NOA" address="0x00009888" value="0x02521FB7" />
+        <register type="NOA" address="0x00009888" value="0x00520000" />
+        <register type="NOA" address="0x00009888" value="0x02535000" />
+        <register type="NOA" address="0x00009888" value="0x1190FC00" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x41900800" />
+        <register type="NOA" address="0x00009888" value="0x43900063" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+        <register type="NOA" address="0x00009888" value="0x45900040" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002744" value="0x00800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x00800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E758" value="0x00015014" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+        <register type="FLEX" address="0x0000E65C" value="0x00055054" />
+    </register_config>
+  </set>
+
+  <set name="Compute Metrics Extra Gen9"
+       mdapi_supported_apis="VK OGL4 OCL IO BB"
+       underscore_name="compute_extra"
+       hw_config_guid="efc497ac-884e-4ee4-a4a8-15fba22aaf21"
+       chipset="KBLGT3"
+       symbol_name="ComputeExtra"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="fpu1_active"
+             units="percent"
+             symbol_name="Fpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU1 Pipe Active including Ext Math"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing including Extended Math processing"
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ  C 5 READ C 6 READ FADD C 7 READ FADD C 2 READ FADD C 3 READ FADD C 4 READ FADD 8 FMUL FADD 100 FMUL $EuCoresTotalCount FDIV $GpuCoreClocks FDIV"
+             underscore_name="fpu1_active_adjusted"
+             units="percent"
+             symbol_name="Fpu1ActiveAdjusted"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x121203E0" />
+        <register type="NOA" address="0x00009888" value="0x123203E0" />
+        <register type="NOA" address="0x00009888" value="0x125203E0" />
+        <register type="NOA" address="0x00009888" value="0x129203E0" />
+        <register type="NOA" address="0x00009888" value="0x12B203E0" />
+        <register type="NOA" address="0x00009888" value="0x12D203E0" />
+        <register type="NOA" address="0x00009888" value="0x024EC000" />
+        <register type="NOA" address="0x00009888" value="0x044EC000" />
+        <register type="NOA" address="0x00009888" value="0x064EC000" />
+        <register type="NOA" address="0x00009888" value="0x022F4000" />
+        <register type="NOA" address="0x00009888" value="0x084CA000" />
+        <register type="NOA" address="0x00009888" value="0x0A4C0042" />
+        <register type="NOA" address="0x00009888" value="0x000D8000" />
+        <register type="NOA" address="0x00009888" value="0x020DA000" />
+        <register type="NOA" address="0x00009888" value="0x040DA000" />
+        <register type="NOA" address="0x00009888" value="0x060D2000" />
+        <register type="NOA" address="0x00009888" value="0x0C0F5000" />
+        <register type="NOA" address="0x00009888" value="0x0E0F006D" />
+        <register type="NOA" address="0x00009888" value="0x022C8000" />
+        <register type="NOA" address="0x00009888" value="0x042C8000" />
+        <register type="NOA" address="0x00009888" value="0x062C8000" />
+        <register type="NOA" address="0x00009888" value="0x0C2C8000" />
+        <register type="NOA" address="0x00009888" value="0x042D8000" />
+        <register type="NOA" address="0x00009888" value="0x06104000" />
+        <register type="NOA" address="0x00009888" value="0x06114000" />
+        <register type="NOA" address="0x00009888" value="0x06120033" />
+        <register type="NOA" address="0x00009888" value="0x00120000" />
+        <register type="NOA" address="0x00009888" value="0x06131000" />
+        <register type="NOA" address="0x00009888" value="0x04308000" />
+        <register type="NOA" address="0x00009888" value="0x04318000" />
+        <register type="NOA" address="0x00009888" value="0x04321980" />
+        <register type="NOA" address="0x00009888" value="0x00320000" />
+        <register type="NOA" address="0x00009888" value="0x04334000" />
+        <register type="NOA" address="0x00009888" value="0x04504000" />
+        <register type="NOA" address="0x00009888" value="0x04514000" />
+        <register type="NOA" address="0x00009888" value="0x04520033" />
+        <register type="NOA" address="0x00009888" value="0x00520000" />
+        <register type="NOA" address="0x00009888" value="0x04531000" />
+        <register type="NOA" address="0x00009888" value="0x00AF8000" />
+        <register type="NOA" address="0x00009888" value="0x0ACC0001" />
+        <register type="NOA" address="0x00009888" value="0x008D8000" />
+        <register type="NOA" address="0x00009888" value="0x028DA000" />
+        <register type="NOA" address="0x00009888" value="0x0C8FB000" />
+        <register type="NOA" address="0x00009888" value="0x0E8F0001" />
+        <register type="NOA" address="0x00009888" value="0x06AC8000" />
+        <register type="NOA" address="0x00009888" value="0x02AD4000" />
+        <register type="NOA" address="0x00009888" value="0x02908000" />
+        <register type="NOA" address="0x00009888" value="0x02918000" />
+        <register type="NOA" address="0x00009888" value="0x02921980" />
+        <register type="NOA" address="0x00009888" value="0x00920000" />
+        <register type="NOA" address="0x00009888" value="0x02934000" />
+        <register type="NOA" address="0x00009888" value="0x02B04000" />
+        <register type="NOA" address="0x00009888" value="0x02B14000" />
+        <register type="NOA" address="0x00009888" value="0x02B20033" />
+        <register type="NOA" address="0x00009888" value="0x00B20000" />
+        <register type="NOA" address="0x00009888" value="0x02B31000" />
+        <register type="NOA" address="0x00009888" value="0x00D08000" />
+        <register type="NOA" address="0x00009888" value="0x00D18000" />
+        <register type="NOA" address="0x00009888" value="0x00D21980" />
+        <register type="NOA" address="0x00009888" value="0x00D34000" />
+        <register type="NOA" address="0x00009888" value="0x1190FC00" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x41900C00" />
+        <register type="NOA" address="0x00009888" value="0x43900002" />
+        <register type="NOA" address="0x00009888" value="0x53900420" />
+        <register type="NOA" address="0x00009888" value="0x459000A1" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+    </register_config>
+  </set>
+
+  <set name="Media Vme Pipe Gen9"
+       mdapi_supported_apis="MEDIA IO BB"
+       underscore_name="vme_pipe"
+       hw_config_guid="bfd9764d-2c5b-4c16-bfc1-89de3ca10917"
+       chipset="KBLGT3"
+       symbol_name="VMEPipe"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="EU Thread Occupancy"
+             description="The percentage of time in which hardware threads occupied EUs."
+             data_type="float"
+             max_equation="100"
+             equation="8 A 10 READ FMUL $EuThreadsCount FDIV $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_thread_occupancy"
+             units="percent"
+             symbol_name="EuThreadOccupancy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VME Busy"
+             description="The percentage of time in which VME (IME or CRE) was actively processing data."
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ B 3 READ FADD 2 FDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vme_busy"
+             units="percent"
+             symbol_name="VMEBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Overview System Batch Tier2"
+             mdapi_group="VME Pipe"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x141A5800" />
+        <register type="NOA" address="0x00009888" value="0x161A00C0" />
+        <register type="NOA" address="0x00009888" value="0x12180240" />
+        <register type="NOA" address="0x00009888" value="0x14180002" />
+        <register type="NOA" address="0x00009888" value="0x149A5800" />
+        <register type="NOA" address="0x00009888" value="0x169A00C0" />
+        <register type="NOA" address="0x00009888" value="0x12980240" />
+        <register type="NOA" address="0x00009888" value="0x14980002" />
+        <register type="NOA" address="0x00009888" value="0x1A4E3FC0" />
+        <register type="NOA" address="0x00009888" value="0x002F1000" />
+        <register type="NOA" address="0x00009888" value="0x022F8000" />
+        <register type="NOA" address="0x00009888" value="0x042F3000" />
+        <register type="NOA" address="0x00009888" value="0x004C4000" />
+        <register type="NOA" address="0x00009888" value="0x0A4C9500" />
+        <register type="NOA" address="0x00009888" value="0x0C4C002A" />
+        <register type="NOA" address="0x00009888" value="0x000D2000" />
+        <register type="NOA" address="0x00009888" value="0x060D8000" />
+        <register type="NOA" address="0x00009888" value="0x080DA000" />
+        <register type="NOA" address="0x00009888" value="0x0A0DA000" />
+        <register type="NOA" address="0x00009888" value="0x0C0DA000" />
+        <register type="NOA" address="0x00009888" value="0x0C0F0400" />
+        <register type="NOA" address="0x00009888" value="0x0E0F5500" />
+        <register type="NOA" address="0x00009888" value="0x100F0015" />
+        <register type="NOA" address="0x00009888" value="0x002C8000" />
+        <register type="NOA" address="0x00009888" value="0x0E2C8000" />
+        <register type="NOA" address="0x00009888" value="0x162CAA00" />
+        <register type="NOA" address="0x00009888" value="0x182C000A" />
+        <register type="NOA" address="0x00009888" value="0x04193000" />
+        <register type="NOA" address="0x00009888" value="0x081A28C1" />
+        <register type="NOA" address="0x00009888" value="0x001A0000" />
+        <register type="NOA" address="0x00009888" value="0x00133000" />
+        <register type="NOA" address="0x00009888" value="0x0613C000" />
+        <register type="NOA" address="0x00009888" value="0x0813F000" />
+        <register type="NOA" address="0x00009888" value="0x00172000" />
+        <register type="NOA" address="0x00009888" value="0x06178000" />
+        <register type="NOA" address="0x00009888" value="0x0817A000" />
+        <register type="NOA" address="0x00009888" value="0x00180037" />
+        <register type="NOA" address="0x00009888" value="0x06180940" />
+        <register type="NOA" address="0x00009888" value="0x08180000" />
+        <register type="NOA" address="0x00009888" value="0x02180000" />
+        <register type="NOA" address="0x00009888" value="0x04183000" />
+        <register type="NOA" address="0x00009888" value="0x04AFC000" />
+        <register type="NOA" address="0x00009888" value="0x06AF3000" />
+        <register type="NOA" address="0x00009888" value="0x0ACC4000" />
+        <register type="NOA" address="0x00009888" value="0x0CCC0015" />
+        <register type="NOA" address="0x00009888" value="0x0A8DA000" />
+        <register type="NOA" address="0x00009888" value="0x0C8DA000" />
+        <register type="NOA" address="0x00009888" value="0x0E8F4000" />
+        <register type="NOA" address="0x00009888" value="0x108F0015" />
+        <register type="NOA" address="0x00009888" value="0x16ACA000" />
+        <register type="NOA" address="0x00009888" value="0x18AC000A" />
+        <register type="NOA" address="0x00009888" value="0x06993000" />
+        <register type="NOA" address="0x00009888" value="0x0C9A28C1" />
+        <register type="NOA" address="0x00009888" value="0x009A0000" />
+        <register type="NOA" address="0x00009888" value="0x0A93F000" />
+        <register type="NOA" address="0x00009888" value="0x0C93F000" />
+        <register type="NOA" address="0x00009888" value="0x0A97A000" />
+        <register type="NOA" address="0x00009888" value="0x0C97A000" />
+        <register type="NOA" address="0x00009888" value="0x0A980977" />
+        <register type="NOA" address="0x00009888" value="0x08980000" />
+        <register type="NOA" address="0x00009888" value="0x04980000" />
+        <register type="NOA" address="0x00009888" value="0x06983000" />
+        <register type="NOA" address="0x00009888" value="0x119000FF" />
+        <register type="NOA" address="0x00009888" value="0x51900040" />
+        <register type="NOA" address="0x00009888" value="0x41900020" />
+        <register type="NOA" address="0x00009888" value="0x55900004" />
+        <register type="NOA" address="0x00009888" value="0x45900400" />
+        <register type="NOA" address="0x00009888" value="0x479008A5" />
+        <register type="NOA" address="0x00009888" value="0x57900000" />
+        <register type="NOA" address="0x00009888" value="0x49900002" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x30800000" />
+        <register type="OA" address="0x00002770" value="0x00100030" />
+        <register type="OA" address="0x00002774" value="0x0000FFF9" />
+        <register type="OA" address="0x00002778" value="0x00000002" />
+        <register type="OA" address="0x0000277C" value="0x0000FFFC" />
+        <register type="OA" address="0x00002780" value="0x00000002" />
+        <register type="OA" address="0x00002784" value="0x0000FFF3" />
+        <register type="OA" address="0x00002788" value="0x00100180" />
+        <register type="OA" address="0x0000278C" value="0x0000FFCF" />
+        <register type="OA" address="0x00002790" value="0x00000002" />
+        <register type="OA" address="0x00002794" value="0x0000FFCF" />
+        <register type="OA" address="0x00002798" value="0x00000002" />
+        <register type="OA" address="0x0000279C" value="0x0000FF3F" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00008003" />
+    </register_config>
+  </set>
+
+  <set name="Gpu Rings Busyness"
+       mdapi_supported_apis="VK OGL OCL MEDIA IO BB"
+       underscore_name="gpu_busyness"
+       hw_config_guid="b55ecba1-2aa9-422e-89ff-b9e30f03d447"
+       chipset="KBLGT3"
+       symbol_name="GpuBusyness"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="Vebox Ring Busy"
+             description="The percentage of time when vebox command streamer was busy."
+             data_type="float"
+             max_equation="100"
+             equation="C 4 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vebox_busy"
+             units="percent"
+             symbol_name="VeboxBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="System Frame Batch"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Render Ring Busy"
+             description="The percentage of time when render command streamer was busy."
+             data_type="float"
+             max_equation="100"
+             equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="render_busy"
+             units="percent"
+             symbol_name="RenderBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="System Frame Batch"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Vdbox0 Ring Busy"
+             description="The percentage of time when Vdbox0 command streamer was busy."
+             data_type="float"
+             max_equation="100"
+             equation="C 6 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vdbox0_busy"
+             units="percent"
+             symbol_name="Vdbox0Busy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="System Frame Batch"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Blitter Ring Busy"
+             description="The percentage of time when blitter command streamer was busy."
+             data_type="float"
+             max_equation="100"
+             equation="C 3 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="blitter_busy"
+             units="percent"
+             symbol_name="BlitterBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="System Frame Batch"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="AnyRingBusy"
+             description="The percentage of time when any command streamer was busy."
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="any_ring_busy"
+             units="percent"
+             symbol_name="AnyRingBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Vdbox1 Ring Busy"
+             description="The percentage of time when Vdbox1 command streamer was busy."
+             data_type="float"
+             max_equation="100"
+             equation="C 5 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vdbox1_busy"
+             units="percent"
+             symbol_name="Vdbox1Busy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="System Frame Batch"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x19D05800" />
+        <register type="NOA" address="0x00009888" value="0x13805800" />
+        <register type="NOA" address="0x00009888" value="0x05962C25" />
+        <register type="NOA" address="0x00009888" value="0x19950016" />
+        <register type="NOA" address="0x00009888" value="0x19C05800" />
+        <register type="NOA" address="0x00009888" value="0x05D00085" />
+        <register type="NOA" address="0x00009888" value="0x25D00000" />
+        <register type="NOA" address="0x00009888" value="0x09D54000" />
+        <register type="NOA" address="0x00009888" value="0x07800035" />
+        <register type="NOA" address="0x00009888" value="0x11800000" />
+        <register type="NOA" address="0x00009888" value="0x1D810400" />
+        <register type="NOA" address="0x00009888" value="0x21960000" />
+        <register type="NOA" address="0x00009888" value="0x0996C000" />
+        <register type="NOA" address="0x00009888" value="0x0B964000" />
+        <register type="NOA" address="0x00009888" value="0x19938000" />
+        <register type="NOA" address="0x00009888" value="0x1B930068" />
+        <register type="NOA" address="0x00009888" value="0x15948000" />
+        <register type="NOA" address="0x00009888" value="0x1B94000C" />
+        <register type="NOA" address="0x00009888" value="0x03957500" />
+        <register type="NOA" address="0x00009888" value="0x1D950000" />
+        <register type="NOA" address="0x00009888" value="0x17950000" />
+        <register type="NOA" address="0x00009888" value="0x07E54000" />
+        <register type="NOA" address="0x00009888" value="0x07928000" />
+        <register type="NOA" address="0x00009888" value="0x03988000" />
+        <register type="NOA" address="0x00009888" value="0x17908000" />
+        <register type="NOA" address="0x00009888" value="0x19904000" />
+        <register type="NOA" address="0x00009888" value="0x1B908000" />
+        <register type="NOA" address="0x00009888" value="0x1D908000" />
+        <register type="NOA" address="0x00009888" value="0x1F908000" />
+        <register type="NOA" address="0x00009888" value="0x09978000" />
+        <register type="NOA" address="0x00009888" value="0x05C08500" />
+        <register type="NOA" address="0x00009888" value="0x25C00000" />
+        <register type="NOA" address="0x00009888" value="0x1BC00000" />
+        <register type="NOA" address="0x00009888" value="0x0BC54000" />
+        <register type="NOA" address="0x00009888" value="0x11900000" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x43900463" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+        <register type="NOA" address="0x00009888" value="0x45900040" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x10800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+        <register type="OA" address="0x00002770" value="0x0007C000" />
+        <register type="OA" address="0x00002774" value="0x000007FF" />
+    </register_config>
+  </set>
+
+  <set name="MDAPI testing set Gen9"
+       mdapi_supported_apis="VK OGL OCL IO BB"
+       underscore_name="test_oa"
+       hw_config_guid="f1792f32-6db2-4b50-b4b2-557128f1688d"
+       chipset="KBLGT3"
+       symbol_name="TestOa"
+       >
+    <counter name="TestCounter7"
+             description="HW test counter 7. Factor: 0.666"
+             data_type="uint64"
+             equation="B 7 READ"
+             underscore_name="counter7"
+             units="events"
+             symbol_name="Counter7"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="TestCounter8"
+             description="HW test counter 8. Should be equal to 1."
+             data_type="uint64"
+             equation="C 7 READ"
+             underscore_name="counter8"
+             units="events"
+             symbol_name="Counter8"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="TestCounter4"
+             description="HW test counter 4. Factor: 0.333"
+             data_type="uint64"
+             equation="B 4 READ"
+             underscore_name="counter4"
+             units="events"
+             symbol_name="Counter4"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="TestCounter5"
+             description="HW test counter 5. Factor: 0.333"
+             data_type="uint64"
+             equation="B 5 READ"
+             underscore_name="counter5"
+             units="events"
+             symbol_name="Counter5"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="TestCounter6"
+             description="HW test counter 6. Factor: 0.166"
+             data_type="uint64"
+             equation="B 6 READ"
+             underscore_name="counter6"
+             units="events"
+             symbol_name="Counter6"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="TestCounter3"
+             description="HW test counter 3. Factor: 0.5"
+             data_type="uint64"
+             equation="B 3 READ"
+             underscore_name="counter3"
+             units="events"
+             symbol_name="Counter3"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="TestCounter0"
+             description="HW test counter 0. Factor: 0.0"
+             data_type="uint64"
+             equation="B 0 READ"
+             underscore_name="counter0"
+             units="events"
+             symbol_name="Counter0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="TestCounter1"
+             description="HW test counter 1. Factor: 1.0"
+             data_type="uint64"
+             equation="B 1 READ"
+             underscore_name="counter1"
+             units="events"
+             symbol_name="Counter1"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="TestCounter2"
+             description="HW test counter 2. Factor: 1.0"
+             data_type="uint64"
+             equation="B 2 READ"
+             underscore_name="counter2"
+             units="events"
+             symbol_name="Counter2"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x11810000" />
+        <register type="NOA" address="0x00009888" value="0x07810013" />
+        <register type="NOA" address="0x00009888" value="0x1F810000" />
+        <register type="NOA" address="0x00009888" value="0x1D810000" />
+        <register type="NOA" address="0x00009888" value="0x1B930040" />
+        <register type="NOA" address="0x00009888" value="0x07E54000" />
+        <register type="NOA" address="0x00009888" value="0x1F908000" />
+        <register type="NOA" address="0x00009888" value="0x11900000" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+        <register type="NOA" address="0x00009888" value="0x45900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002744" value="0x00800000" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002770" value="0x00000004" />
+        <register type="OA" address="0x00002774" value="0x00000000" />
+        <register type="OA" address="0x00002778" value="0x00000003" />
+        <register type="OA" address="0x0000277C" value="0x00000000" />
+        <register type="OA" address="0x00002780" value="0x00000007" />
+        <register type="OA" address="0x00002784" value="0x00000000" />
+        <register type="OA" address="0x00002788" value="0x00100002" />
+        <register type="OA" address="0x0000278C" value="0x0000FFF7" />
+        <register type="OA" address="0x00002790" value="0x00100002" />
+        <register type="OA" address="0x00002794" value="0x0000FFCF" />
+        <register type="OA" address="0x00002798" value="0x00100082" />
+        <register type="OA" address="0x0000279C" value="0x0000FFEF" />
+        <register type="OA" address="0x000027A0" value="0x001000C2" />
+        <register type="OA" address="0x000027A4" value="0x0000FFE7" />
+        <register type="OA" address="0x000027A8" value="0x00100001" />
+        <register type="OA" address="0x000027AC" value="0x0000FFE7" />
+    </register_config>
+  </set>
+
+  <set name="Metric set PMA Stall"
+       mdapi_supported_apis="VK OGL OGL4 OCL IO MEDIA"
+       underscore_name="pma__stall"
+       hw_config_guid="85bc2e4f-2563-4388-921b-dc0dad879cf3"
+       chipset="KBLGT3"
+       symbol_name="PMA_Stall"
+       >
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="STC PMA stall"
+             description="Percentage of time when stencil cache line and an overlapping pixel are causing stalls"
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ B 1 READ FADD 2 FDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="stc_pma_stall"
+             units="percent"
+             symbol_name="StcPMAStall"
+             availability="$SliceMask 1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_group="GPU/Stencil Cache"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x122D3080" />
+        <register type="NOA" address="0x00009888" value="0x000D2000" />
+        <register type="NOA" address="0x00009888" value="0x060D8000" />
+        <register type="NOA" address="0x00009888" value="0x080DA000" />
+        <register type="NOA" address="0x00009888" value="0x0A0DA000" />
+        <register type="NOA" address="0x00009888" value="0x0C0F0800" />
+        <register type="NOA" address="0x00009888" value="0x0E0FAA00" />
+        <register type="NOA" address="0x00009888" value="0x100F0002" />
+        <register type="NOA" address="0x00009888" value="0x002D0025" />
+        <register type="NOA" address="0x00009888" value="0x062D1300" />
+        <register type="NOA" address="0x00009888" value="0x082D16A4" />
+        <register type="NOA" address="0x00009888" value="0x0A2D162E" />
+        <register type="NOA" address="0x00009888" value="0x102D0000" />
+        <register type="NOA" address="0x00009888" value="0x1190003F" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x41900000" />
+        <register type="NOA" address="0x00009888" value="0x55900000" />
+        <register type="NOA" address="0x00009888" value="0x45900000" />
+        <register type="NOA" address="0x00009888" value="0x47900000" />
+        <register type="NOA" address="0x00009888" value="0x57900000" />
+        <register type="NOA" address="0x00009888" value="0x49900000" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x30800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+        <register type="OA" address="0x00002770" value="0x00E00021" />
+        <register type="OA" address="0x00002774" value="0x0007FFF8" />
+        <register type="OA" address="0x00002778" value="0x07000101" />
+        <register type="OA" address="0x0000277C" value="0x0038FFC7" />
+    </register_config>
+  </set>
+
+</metrics>
diff --git a/lib/i915/perf-configs/oa-lkf.xml b/lib/i915/perf-configs/oa-lkf.xml
new file mode 100644
index 00000000..9b677468
--- /dev/null
+++ b/lib/i915/perf-configs/oa-lkf.xml
@@ -0,0 +1,11803 @@
+<?xml version="1.0"?>
+<metrics version="1581936283" merge_md5="">
+  <set name="Render Metrics Basic Gen11"
+       mdapi_supported_apis="VK OGL OCL IO BB"
+       underscore_name="render_basic"
+       hw_config_guid="807f52f4-e457-4da4-b2b6-9a7b6dc2b1ed"
+       chipset="LKF"
+       symbol_name="RenderBasic"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Cache Misses"
+             description="The total number of sampler cache misses in all LODs in all sampler units."
+             data_type="uint64"
+             equation="C 4 READ C 5 READ UADD 2 UMUL"
+             underscore_name="sampler_l1_misses"
+             units="messages"
+             symbol_name="SamplerL1Misses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Sampler00 Busy"
+             description="The percentage of time in which Slice0 Sampler0 has been processing EU requests."
+             data_type="float"
+             max_equation="100"
+             equation="C 1 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler00_busy"
+             units="percent"
+             symbol_name="Sampler00Busy"
+             availability="$SubsliceMask 1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_group="Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Samplers Busy"
+             description="The percentage of time in which samplers have been processing EU requests."
+             data_type="float"
+             max_equation="100"
+             equation="$Sampler00Busy"
+             underscore_name="samplers_busy"
+             units="percent"
+             symbol_name="SamplersBusy"
+             availability="$SubsliceMask 9 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="Sampler"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="Sampler00 Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which Slice0 Sampler0 has been slowing down the pipe when processing EU requests."
+             data_type="float"
+             high_watermark="15"
+             equation="C 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             max_equation="100"
+             underscore_name="sampler00_bottleneck"
+             units="percent"
+             symbol_name="Sampler00Bottleneck"
+             availability="$SubsliceMask 1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GTI Read Throughput"
+             description="The total number of GPU memory bytes read from GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL"
+             equation="64  B 5 READ B 4 READ UADD UMUL"
+             underscore_name="gti_read_throughput"
+             units="bytes"
+             symbol_name="GtiReadThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 14 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 13 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Samplers Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which samplers have been slowing down the pipe when processing EU requests."
+             data_type="float"
+             high_watermark="15"
+             equation="$Sampler00Bottleneck"
+             max_equation="100"
+             underscore_name="sampler_bottleneck"
+             units="percent"
+             symbol_name="SamplerBottleneck"
+             availability="$SubsliceMask 9 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Indicate System Frame Batch Draw"
+             mdapi_group="Sampler"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="GTI Write Throughput"
+             description="The total number of GPU memory bytes written to GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL"
+             equation="64  B 0 READ B 2 READ UADD UMUL"
+             underscore_name="gti_write_throughput"
+             units="bytes"
+             symbol_name="GtiWriteThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ A 31 READ UADD A 32 READ UADD 64 UMUL"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00000D04" value="0x00000200" />
+        <register type="NOA" address="0x00009840" value="0x00000000" />
+        <register type="NOA" address="0x00009884" value="0x00000000" />
+        <register type="NOA" address="0x00009888" value="0x142C0014" />
+        <register type="NOA" address="0x00009888" value="0x14120700" />
+        <register type="NOA" address="0x00009888" value="0x121500E0" />
+        <register type="NOA" address="0x00009888" value="0x1E1E0030" />
+        <register type="NOA" address="0x00009888" value="0x1A204000" />
+        <register type="NOA" address="0x00009888" value="0x1C200001" />
+        <register type="NOA" address="0x00009888" value="0x1E213000" />
+        <register type="NOA" address="0x00009888" value="0x0E2C1831" />
+        <register type="NOA" address="0x00009888" value="0x102C0000" />
+        <register type="NOA" address="0x00009888" value="0x182C0000" />
+        <register type="NOA" address="0x00009888" value="0x10040140" />
+        <register type="NOA" address="0x00009888" value="0x0E040005" />
+        <register type="NOA" address="0x00009888" value="0x14050050" />
+        <register type="NOA" address="0x00009888" value="0x06054000" />
+        <register type="NOA" address="0x00009888" value="0x08051000" />
+        <register type="NOA" address="0x00009888" value="0x260600C0" />
+        <register type="NOA" address="0x00009888" value="0x24061800" />
+        <register type="NOA" address="0x00009888" value="0x04120023" />
+        <register type="NOA" address="0x00009888" value="0x10120000" />
+        <register type="NOA" address="0x00009888" value="0x08120000" />
+        <register type="NOA" address="0x00009888" value="0x06131000" />
+        <register type="NOA" address="0x00009888" value="0x04144000" />
+        <register type="NOA" address="0x00009888" value="0x02150980" />
+        <register type="NOA" address="0x00009888" value="0x10150000" />
+        <register type="NOA" address="0x00009888" value="0x1815000F" />
+        <register type="NOA" address="0x00009888" value="0x06150000" />
+        <register type="NOA" address="0x00009888" value="0x08154000" />
+        <register type="NOA" address="0x00009888" value="0x0E18A000" />
+        <register type="NOA" address="0x00009888" value="0x14190028" />
+        <register type="NOA" address="0x00009884" value="0x00000003" />
+        <register type="NOA" address="0x00009888" value="0x1A1C01C0" />
+        <register type="NOA" address="0x00009888" value="0x1C1C000A" />
+        <register type="NOA" address="0x00009888" value="0x1A5C01C0" />
+        <register type="NOA" address="0x00009888" value="0x1C5C000A" />
+        <register type="NOA" address="0x00009888" value="0x001C0097" />
+        <register type="NOA" address="0x00009888" value="0x0A1CA700" />
+        <register type="NOA" address="0x00009888" value="0x101C0000" />
+        <register type="NOA" address="0x00009888" value="0x081D0100" />
+        <register type="NOA" address="0x00009888" value="0x0A1D0008" />
+        <register type="NOA" address="0x00009888" value="0x085C0097" />
+        <register type="NOA" address="0x00009888" value="0x0A5C00A7" />
+        <register type="NOA" address="0x00009888" value="0x105C0000" />
+        <register type="NOA" address="0x00009888" value="0x0A5D0005" />
+        <register type="NOA" address="0x00009888" value="0x181E8000" />
+        <register type="NOA" address="0x00009888" value="0x1E1EB300" />
+        <register type="NOA" address="0x00009888" value="0x301F4000" />
+        <register type="NOA" address="0x00009888" value="0x501F2004" />
+        <register type="NOA" address="0x00009888" value="0x521F0090" />
+        <register type="NOA" address="0x00009888" value="0x541F0024" />
+        <register type="NOA" address="0x00009888" value="0x4E1F2000" />
+        <register type="NOA" address="0x00009888" value="0x3E1F6100" />
+        <register type="NOA" address="0x00009888" value="0x461F6100" />
+        <register type="NOA" address="0x00009888" value="0x481F6100" />
+        <register type="NOA" address="0x00009888" value="0x4A1F0061" />
+        <register type="NOA" address="0x00009888" value="0x141F0000" />
+        <register type="NOA" address="0x00009888" value="0x4C1F0000" />
+        <register type="NOA" address="0x00009888" value="0x421F3060" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x00800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E65C" value="0xFFFFFFFF" />
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E758" value="0x00051050" />
+        <register type="FLEX" address="0x0000E45C" value="0x00000052" />
+    </register_config>
+  </set>
+
+  <set name="Compute Metrics Basic Gen11"
+       mdapi_supported_apis="VK OGL OCL IO BB"
+       underscore_name="compute_basic"
+       hw_config_guid="3d5fa517-a3e5-4d90-9ad0-b4c3d114ba9d"
+       chipset="LKF"
+       symbol_name="ComputeBasic"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Untyped Bytes Read"
+             description="The total number of untyped memory bytes read via Data Port."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="C 3 READ C 2 READ UADD $EuSubslicesTotalCount UMUL 32 UMUL"
+             underscore_name="untyped_bytes_read"
+             units="bytes"
+             symbol_name="UntypedBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Typed Bytes Written"
+             description="The total number of typed memory bytes written via Data Port."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="C 5 READ C 4 READ UADD $EuSubslicesTotalCount UMUL 32 UMUL"
+             underscore_name="typed_bytes_written"
+             units="bytes"
+             symbol_name="TypedBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU AVG IPC Rate"
+             description="The average rate of IPC calculated for 2 FPU pipelines."
+             data_type="float"
+             max_equation="2"
+             equation="A 9 READ A 10 READ A 11 READ FADD A 9 READ FSUB FDIV 1 FADD"
+             underscore_name="eu_avg_ipc_rate"
+             units="number"
+             symbol_name="EuAvgIpcRate"
+             semantic_type="ratio"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="EU FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="fpu1_active"
+             units="percent"
+             symbol_name="Fpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="fpu0_active"
+             units="percent"
+             symbol_name="Fpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Typed Atomics Accesses"
+             description="The total number of typed atomic accesses via Data Port."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="B 4 READ B 5 READ FADD 2 FDIV $EuSubslicesTotalCount FMUL"
+             underscore_name="typed_atomics"
+             units="events"
+             symbol_name="TypedAtomics"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texel lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GTI Read Throughput"
+             description="The total number of GPU memory bytes read from GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL"
+             equation="64  B 7 READ B 6 READ UADD UMUL"
+             underscore_name="gti_read_throughput"
+             units="bytes"
+             symbol_name="GtiReadThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Untyped Writes"
+             description="The total number of untyped memory bytes written via Data Port."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="C 1 READ C 0 READ UADD $EuSubslicesTotalCount UMUL 32 UMUL"
+             underscore_name="untyped_bytes_written"
+             units="bytes"
+             symbol_name="UntypedBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="Typed Bytes Read"
+             description="The total number of typed memory bytes read via Data Port."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="C 7 READ C 6 READ UADD $EuSubslicesTotalCount UMUL 32 UMUL"
+             underscore_name="typed_bytes_read"
+             units="bytes"
+             symbol_name="TypedBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="EU Thread Occupancy"
+             description="The percentage of time in which hardware threads occupied EUs."
+             data_type="float"
+             max_equation="100"
+             equation="8 A 13 READ FMUL $EuThreadsCount FDIV $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_thread_occupancy"
+             units="percent"
+             symbol_name="EuThreadOccupancy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="GTI Write Throughput"
+             description="The total number of GPU memory bytes written to GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL"
+             equation="64  B 0 READ B 2 READ UADD UMUL"
+             underscore_name="gti_write_throughput"
+             units="bytes"
+             symbol_name="GtiWriteThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ A 31 READ UADD A 32 READ UADD 64 UMUL"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <counter name="EU Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_send_active"
+             units="percent"
+             symbol_name="EuSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00000D04" value="0x00000200" />
+        <register type="NOA" address="0x00009840" value="0x00000000" />
+        <register type="NOA" address="0x00009884" value="0x00000000" />
+        <register type="NOA" address="0x00009888" value="0x12230012" />
+        <register type="NOA" address="0x00009888" value="0x10230019" />
+        <register type="NOA" address="0x00009888" value="0x12A30012" />
+        <register type="NOA" address="0x00009888" value="0x10A30019" />
+        <register type="NOA" address="0x00009888" value="0x1A200080" />
+        <register type="NOA" address="0x00009888" value="0x1C200002" />
+        <register type="NOA" address="0x00009888" value="0x04208000" />
+        <register type="NOA" address="0x00009888" value="0x08208000" />
+        <register type="NOA" address="0x00009888" value="0x0C208000" />
+        <register type="NOA" address="0x00009888" value="0x0A230031" />
+        <register type="NOA" address="0x00009888" value="0x0E231E00" />
+        <register type="NOA" address="0x00009888" value="0x0223003D" />
+        <register type="NOA" address="0x00009888" value="0x04230032" />
+        <register type="NOA" address="0x00009888" value="0x06230033" />
+        <register type="NOA" address="0x00009888" value="0x00230000" />
+        <register type="NOA" address="0x00009888" value="0x1AA08200" />
+        <register type="NOA" address="0x00009888" value="0x02A08000" />
+        <register type="NOA" address="0x00009888" value="0x06A08000" />
+        <register type="NOA" address="0x00009888" value="0x0AA08000" />
+        <register type="NOA" address="0x00009888" value="0x0AA31880" />
+        <register type="NOA" address="0x00009888" value="0x0EA3003C" />
+        <register type="NOA" address="0x00009888" value="0x00A31E80" />
+        <register type="NOA" address="0x00009888" value="0x02A31900" />
+        <register type="NOA" address="0x00009888" value="0x04A31980" />
+        <register type="NOA" address="0x00009888" value="0x0E044055" />
+        <register type="NOA" address="0x00009888" value="0x10040141" />
+        <register type="NOA" address="0x00009888" value="0x0C045000" />
+        <register type="NOA" address="0x00009888" value="0x0E055000" />
+        <register type="NOA" address="0x00009888" value="0x14050050" />
+        <register type="NOA" address="0x00009888" value="0x04054000" />
+        <register type="NOA" address="0x00009888" value="0x06055000" />
+        <register type="NOA" address="0x00009888" value="0x08055000" />
+        <register type="NOA" address="0x00009888" value="0x0A051000" />
+        <register type="NOA" address="0x00009888" value="0x260600CC" />
+        <register type="NOA" address="0x00009888" value="0x24067E00" />
+        <register type="NOA" address="0x00009888" value="0x18123000" />
+        <register type="NOA" address="0x00009888" value="0x1A12000C" />
+        <register type="NOA" address="0x00009888" value="0x0212C000" />
+        <register type="NOA" address="0x00009888" value="0x0612C000" />
+        <register type="NOA" address="0x00009888" value="0x0A12C000" />
+        <register type="NOA" address="0x00009888" value="0x08138000" />
+        <register type="NOA" address="0x00009888" value="0x0A134000" />
+        <register type="NOA" address="0x00009888" value="0x0413A000" />
+        <register type="NOA" address="0x00009888" value="0x06132000" />
+        <register type="NOA" address="0x00009888" value="0x0A148000" />
+        <register type="NOA" address="0x00009888" value="0x0E144000" />
+        <register type="NOA" address="0x00009888" value="0x00148000" />
+        <register type="NOA" address="0x00009888" value="0x02148000" />
+        <register type="NOA" address="0x00009888" value="0x04148000" />
+        <register type="NOA" address="0x00009888" value="0x16150380" />
+        <register type="NOA" address="0x00009888" value="0x1815000D" />
+        <register type="NOA" address="0x00009888" value="0x02154000" />
+        <register type="NOA" address="0x00009888" value="0x0415C000" />
+        <register type="NOA" address="0x00009888" value="0x06154000" />
+        <register type="NOA" address="0x00009888" value="0x0815C000" />
+        <register type="NOA" address="0x00009888" value="0x0A154000" />
+        <register type="NOA" address="0x00009888" value="0x0C15C000" />
+        <register type="NOA" address="0x00009888" value="0x0A182000" />
+        <register type="NOA" address="0x00009888" value="0x0E188000" />
+        <register type="NOA" address="0x00009888" value="0x02182000" />
+        <register type="NOA" address="0x00009888" value="0x04182000" />
+        <register type="NOA" address="0x00009888" value="0x06182000" />
+        <register type="NOA" address="0x00009888" value="0x12190400" />
+        <register type="NOA" address="0x00009888" value="0x14190020" />
+        <register type="NOA" address="0x00009888" value="0x0A192000" />
+        <register type="NOA" address="0x00009888" value="0x0C192000" />
+        <register type="NOA" address="0x00009888" value="0x0E192000" />
+        <register type="NOA" address="0x00009888" value="0x0A1C8000" />
+        <register type="NOA" address="0x00009888" value="0x0E1C2000" />
+        <register type="NOA" address="0x00009888" value="0x001C8000" />
+        <register type="NOA" address="0x00009888" value="0x021C8000" />
+        <register type="NOA" address="0x00009888" value="0x041C8000" />
+        <register type="NOA" address="0x00009888" value="0x121D1000" />
+        <register type="NOA" address="0x00009888" value="0x141D0008" />
+        <register type="NOA" address="0x00009888" value="0x081D8000" />
+        <register type="NOA" address="0x00009888" value="0x0A1D8000" />
+        <register type="NOA" address="0x00009888" value="0x0C1D8000" />
+        <register type="NOA" address="0x00009884" value="0x00000003" />
+        <register type="NOA" address="0x00009888" value="0x1A1C01C0" />
+        <register type="NOA" address="0x00009888" value="0x1C1C000A" />
+        <register type="NOA" address="0x00009888" value="0x1A5C01C0" />
+        <register type="NOA" address="0x00009888" value="0x1C5C000A" />
+        <register type="NOA" address="0x00009888" value="0x001C0097" />
+        <register type="NOA" address="0x00009888" value="0x0C1CA700" />
+        <register type="NOA" address="0x00009888" value="0x101C0000" />
+        <register type="NOA" address="0x00009888" value="0x081D0100" />
+        <register type="NOA" address="0x00009888" value="0x0A1D0020" />
+        <register type="NOA" address="0x00009888" value="0x085C0097" />
+        <register type="NOA" address="0x00009888" value="0x0C5C00A7" />
+        <register type="NOA" address="0x00009888" value="0x105C0000" />
+        <register type="NOA" address="0x00009888" value="0x0A5D0011" />
+        <register type="NOA" address="0x00009888" value="0x181E8000" />
+        <register type="NOA" address="0x00009888" value="0x1E1E0300" />
+        <register type="NOA" address="0x00009888" value="0x201E000B" />
+        <register type="NOA" address="0x00009888" value="0x301F4000" />
+        <register type="NOA" address="0x00009888" value="0x501F2124" />
+        <register type="NOA" address="0x00009888" value="0x521F2520" />
+        <register type="NOA" address="0x00009888" value="0x541F0024" />
+        <register type="NOA" address="0x00009888" value="0x3A1F8000" />
+        <register type="NOA" address="0x00009888" value="0x4E1F2430" />
+        <register type="NOA" address="0x00009888" value="0x3E1F0300" />
+        <register type="NOA" address="0x00009888" value="0x461F0300" />
+        <register type="NOA" address="0x00009888" value="0x481F3000" />
+        <register type="NOA" address="0x00009888" value="0x4A1F0300" />
+        <register type="NOA" address="0x00009888" value="0x4C1F0003" />
+        <register type="NOA" address="0x00009888" value="0x141F0000" />
+        <register type="NOA" address="0x00009888" value="0x401F3000" />
+        <register type="NOA" address="0x00009888" value="0x421F3000" />
+        <register type="NOA" address="0x00009888" value="0x441F3000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x00800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E65C" value="0xFFFFFFFF" />
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00000003" />
+        <register type="FLEX" address="0x0000E658" value="0x00002001" />
+        <register type="FLEX" address="0x0000E758" value="0x00000008" />
+    </register_config>
+  </set>
+
+  <set name="ComputeExtended Gen11"
+       mdapi_supported_apis="VK OGL OGL4 OCL MEDIA IO BB"
+       underscore_name="compute_extended"
+       hw_config_guid="2ab52087-3700-4db4-8dda-f73b77edfd93"
+       chipset="LKF"
+       symbol_name="ComputeExtended"
+       >
+    <counter name="UntypedWritesPerCacheLine"
+             description="The ratio of EU untyped write requests to L3 cache line writes."
+             data_type="float"
+             equation="B 7 READ B 1 READ FADD C 2 READ FADD C 3 READ FDIV"
+             underscore_name="untyped_writes_per_cache_line"
+             units="eu sends to l3 cache lines"
+             symbol_name="UntypedWritesPerCacheLine"
+             availability="$SubsliceMask 1 AND"
+             semantic_type="ratio"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="Eu Typed Atomics 00"
+             description="Slice0 Dualsubslice 0 Eu Typed Atomics"
+             data_type="uint64"
+             equation="B 2 READ"
+             underscore_name="eu_typed_atomics00"
+             units="messages"
+             symbol_name="EuTypedAtomics00"
+             availability="$SubsliceMask 1 AND"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="Typed Atomics 00"
+             description="Slice 0 Dualsubslice 0 typed atomics."
+             data_type="uint64"
+             equation="C 7 READ"
+             underscore_name="typed_atomics00"
+             units="messages"
+             symbol_name="TypedAtomics00"
+             availability="$SubsliceMask 1 AND"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="TypedAtomicsPerCacheLine"
+             description="The ratio of EU typed atomics requests to L3 cache line writes."
+             data_type="float"
+             equation="$EuTypedAtomics00 $TypedAtomics00 FDIV"
+             underscore_name="typed_atomics_per_cache_line"
+             units="eu sends to l3 cache lines"
+             symbol_name="TypedAtomicsPerCacheLine"
+             availability="$SubsliceMask 1 AND"
+             semantic_type="ratio"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="Eu A64 Untyped Reads 00"
+             description="Slice0 Dualsubslice 0 Eu A64 Untyped Reads"
+             data_type="float"
+             equation="B 5 READ C 1 READ FADD B 6 READ FADD"
+             underscore_name="eu_a64_untyped_reads00"
+             units="messages"
+             symbol_name="EuA64UntypedReads00"
+             availability="$SubsliceMask 1 AND"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="Eu A32 Untyped Writes 00"
+             description="Slice0 Dualsubslice 0 Eu A32 Untyped Writes"
+             data_type="uint64"
+             equation="B 7 READ B 1 READ UADD"
+             underscore_name="eu_a32_untyped_writes00"
+             units="messages"
+             symbol_name="EuA32UntypedWrites00"
+             availability="$SubsliceMask 1 AND"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="Eu Typed Reads 00"
+             description="Slice0 Dualsubslice 0 Eu Typed Reads"
+             data_type="uint64"
+             equation="B 3 READ"
+             underscore_name="eu_typed_reads00"
+             units="messages"
+             symbol_name="EuTypedReads00"
+             availability="$SubsliceMask 1 AND"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="Eu Typed Writes 00"
+             description="Slice0 Dualsubslice 0 Eu Typed Writes"
+             data_type="uint64"
+             equation="B 4 READ"
+             underscore_name="eu_typed_writes00"
+             units="messages"
+             symbol_name="EuTypedWrites00"
+             availability="$SubsliceMask 1 AND"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="Typed Writes 00"
+             description="Slice 0 Dualsubslice 0 typed writes."
+             data_type="uint64"
+             equation="C 5 READ"
+             underscore_name="typed_writes00"
+             units="messages"
+             symbol_name="TypedWrites00"
+             availability="$SubsliceMask 1 AND"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="TypedWritesPerCacheLine"
+             description="The ratio of EU typed write requests to L3 cache line writes."
+             data_type="float"
+             equation="$EuTypedWrites00 $TypedWrites00 FDIV"
+             underscore_name="typed_writes_per_cache_line"
+             units="eu sends to l3 cache lines"
+             symbol_name="TypedWritesPerCacheLine"
+             availability="$SubsliceMask 1 AND"
+             semantic_type="ratio"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Untyped Writes 00"
+             description="Slice 0 Dualsubslice 0 untyped writes (including SLM writes)."
+             data_type="uint64"
+             equation="C 3 READ"
+             underscore_name="untyped_writes00"
+             units="messages"
+             symbol_name="UntypedWrites00"
+             availability="$SubsliceMask 1 AND"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="Untyped Reads 00"
+             description="Slice 0 Dualsubslice 0 untyped reads (including SLM reads)."
+             data_type="uint64"
+             equation="C 4 READ"
+             underscore_name="untyped_reads00"
+             units="messages"
+             symbol_name="UntypedReads00"
+             availability="$SubsliceMask 1 AND"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="Eu A64 Untyped Writes 00"
+             description="Slice0 Dualsubslice 0 Eu A64 Untyped Writes"
+             data_type="uint64"
+             equation="C 2 READ"
+             underscore_name="eu_a64_untyped_writes00"
+             units="messages"
+             symbol_name="EuA64UntypedWrites00"
+             availability="$SubsliceMask 1 AND"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="UntypedReadsPerCacheLine"
+             description="The ratio of EU untyped read requests to L3 cache line reads."
+             data_type="float"
+             equation="B 0 READ B 5 READ C 1 READ FADD B 6 READ FADD FADD C 4 READ FDIV"
+             underscore_name="untyped_reads_per_cache_line"
+             units="eu sends to l3 cache lines"
+             symbol_name="UntypedReadsPerCacheLine"
+             semantic_type="ratio"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="Typed Reads 00"
+             description="Slice 0 Dualsubslice 0 typed reads."
+             data_type="uint64"
+             equation="C 6 READ"
+             underscore_name="typed_reads00"
+             units="messages"
+             symbol_name="TypedReads00"
+             availability="$SubsliceMask 1 AND"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="TypedReadsPerCacheLine"
+             description="The ratio of EU typed read requests to L3 cache line reads."
+             data_type="float"
+             equation="$EuTypedReads00 $TypedReads00 FDIV"
+             underscore_name="typed_reads_per_cache_line"
+             units="eu sends to l3 cache lines"
+             symbol_name="TypedReadsPerCacheLine"
+             availability="$SubsliceMask 1 AND"
+             semantic_type="ratio"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="Eu A32 Untyped Reads 00"
+             description="Slice0 Dualsubslice 0 Eu A32 Untyped Reads"
+             data_type="uint64"
+             equation="B 0 READ"
+             underscore_name="eu_a32_untyped_reads00"
+             units="messages"
+             symbol_name="EuA32UntypedReads00"
+             availability="$SubsliceMask 1 AND"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00000D04" value="0x00000200" />
+        <register type="NOA" address="0x00009840" value="0x00000000" />
+        <register type="NOA" address="0x00009884" value="0x00000000" />
+        <register type="NOA" address="0x00009888" value="0x14210160" />
+        <register type="NOA" address="0x00009888" value="0x18210120" />
+        <register type="NOA" address="0x00009888" value="0x12230019" />
+        <register type="NOA" address="0x00009888" value="0x10230012" />
+        <register type="NOA" address="0x00009888" value="0x101E8000" />
+        <register type="NOA" address="0x00009888" value="0x1C1EE000" />
+        <register type="NOA" address="0x00009888" value="0x1E1E001F" />
+        <register type="NOA" address="0x00009888" value="0x00204000" />
+        <register type="NOA" address="0x00009888" value="0x0E204000" />
+        <register type="NOA" address="0x00009888" value="0x18204000" />
+        <register type="NOA" address="0x00009888" value="0x1A205550" />
+        <register type="NOA" address="0x00009888" value="0x04208000" />
+        <register type="NOA" address="0x00009888" value="0x06208000" />
+        <register type="NOA" address="0x00009888" value="0x08208000" />
+        <register type="NOA" address="0x00009888" value="0x0A208000" />
+        <register type="NOA" address="0x00009888" value="0x0C208000" />
+        <register type="NOA" address="0x00009888" value="0x00210041" />
+        <register type="NOA" address="0x00009888" value="0x06214200" />
+        <register type="NOA" address="0x00009888" value="0x08214443" />
+        <register type="NOA" address="0x00009888" value="0x0A214645" />
+        <register type="NOA" address="0x00009888" value="0x0C217647" />
+        <register type="NOA" address="0x00009888" value="0x0E210073" />
+        <register type="NOA" address="0x00009888" value="0x1E210000" />
+        <register type="NOA" address="0x00009888" value="0x10210000" />
+        <register type="NOA" address="0x00009888" value="0x02231AB4" />
+        <register type="NOA" address="0x00009888" value="0x04231DBA" />
+        <register type="NOA" address="0x00009888" value="0x06230039" />
+        <register type="NOA" address="0x00009888" value="0x00230000" />
+        <register type="NOA" address="0x00009888" value="0x0C044400" />
+        <register type="NOA" address="0x00009888" value="0x0E045555" />
+        <register type="NOA" address="0x00009888" value="0x10040055" />
+        <register type="NOA" address="0x00009888" value="0x04051000" />
+        <register type="NOA" address="0x00009888" value="0x0A055000" />
+        <register type="NOA" address="0x00009888" value="0x0C055000" />
+        <register type="NOA" address="0x00009888" value="0x0E055000" />
+        <register type="NOA" address="0x00009888" value="0x14050015" />
+        <register type="NOA" address="0x00009888" value="0x06055000" />
+        <register type="NOA" address="0x00009888" value="0x08055000" />
+        <register type="NOA" address="0x00009888" value="0x2406FD00" />
+        <register type="NOA" address="0x00009888" value="0x2606007F" />
+        <register type="NOA" address="0x00009888" value="0x0015C000" />
+        <register type="NOA" address="0x00009888" value="0x0E15C000" />
+        <register type="NOA" address="0x00009888" value="0x16157FF8" />
+        <register type="NOA" address="0x00009888" value="0x18150003" />
+        <register type="NOA" address="0x00009888" value="0x0415C000" />
+        <register type="NOA" address="0x00009888" value="0x0615C000" />
+        <register type="NOA" address="0x00009888" value="0x0815C000" />
+        <register type="NOA" address="0x00009888" value="0x0A15C000" />
+        <register type="NOA" address="0x00009888" value="0x0C15C000" />
+        <register type="NOA" address="0x00009888" value="0x00182000" />
+        <register type="NOA" address="0x00009888" value="0x0618A000" />
+        <register type="NOA" address="0x00009888" value="0x0818A000" />
+        <register type="NOA" address="0x00009888" value="0x0A18A000" />
+        <register type="NOA" address="0x00009888" value="0x0C18A000" />
+        <register type="NOA" address="0x00009888" value="0x0E182000" />
+        <register type="NOA" address="0x00009888" value="0x0218A000" />
+        <register type="NOA" address="0x00009888" value="0x0418A000" />
+        <register type="NOA" address="0x00009888" value="0x08192000" />
+        <register type="NOA" address="0x00009888" value="0x0E19A000" />
+        <register type="NOA" address="0x00009888" value="0x12195540" />
+        <register type="NOA" address="0x00009888" value="0x1419000A" />
+        <register type="NOA" address="0x00009888" value="0x0A19A000" />
+        <register type="NOA" address="0x00009888" value="0x0C19A000" />
+        <register type="NOA" address="0x00009884" value="0x00000003" />
+        <register type="NOA" address="0x00009888" value="0x18130343" />
+        <register type="NOA" address="0x00009888" value="0x22000008" />
+        <register type="NOA" address="0x00009888" value="0x12008000" />
+        <register type="NOA" address="0x00009888" value="0x0E137300" />
+        <register type="NOA" address="0x00009888" value="0x00137B00" />
+        <register type="NOA" address="0x00009888" value="0x10130000" />
+        <register type="NOA" address="0x00009888" value="0x1E130000" />
+        <register type="NOA" address="0x00009888" value="0x1C130000" />
+        <register type="NOA" address="0x00009888" value="0x0E168000" />
+        <register type="NOA" address="0x00009888" value="0x00168000" />
+        <register type="NOA" address="0x00009888" value="0x1A1A0010" />
+        <register type="NOA" address="0x00009888" value="0x021A4000" />
+        <register type="NOA" address="0x00009888" value="0x301F8000" />
+        <register type="NOA" address="0x00009888" value="0x501F4924" />
+        <register type="NOA" address="0x00009888" value="0x521F4924" />
+        <register type="NOA" address="0x00009888" value="0x541F000C" />
+        <register type="NOA" address="0x00009888" value="0x3A1F2000" />
+        <register type="NOA" address="0x00009888" value="0x4E1F2441" />
+        <register type="NOA" address="0x00009888" value="0x3E1F0000" />
+        <register type="NOA" address="0x00009888" value="0x461F0000" />
+        <register type="NOA" address="0x00009888" value="0x481F0000" />
+        <register type="NOA" address="0x00009888" value="0x4A1F0000" />
+        <register type="NOA" address="0x00009888" value="0x4C1F0000" />
+        <register type="NOA" address="0x00009888" value="0x141F0000" />
+        <register type="NOA" address="0x00009888" value="0x401F1041" />
+        <register type="NOA" address="0x00009888" value="0x421F1010" />
+        <register type="NOA" address="0x00009888" value="0x441F1010" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0xF0800000" />
+        <register type="OA" address="0x00002770" value="0x30000036" />
+        <register type="OA" address="0x00002774" value="0x01FFFE00" />
+        <register type="OA" address="0x00002778" value="0x31000034" />
+        <register type="OA" address="0x0000277C" value="0x01FFFE00" />
+        <register type="OA" address="0x00002780" value="0x00000C9A" />
+        <register type="OA" address="0x00002784" value="0x0000FE00" />
+        <register type="OA" address="0x00002788" value="0x00000C92" />
+        <register type="OA" address="0x0000278C" value="0x0000FE00" />
+        <register type="OA" address="0x00002790" value="0x00000CA2" />
+        <register type="OA" address="0x00002794" value="0x0000FE00" />
+        <register type="OA" address="0x00002798" value="0x00000E42" />
+        <register type="OA" address="0x0000279C" value="0x0000FE00" />
+        <register type="OA" address="0x000027A0" value="0x00000E6A" />
+        <register type="OA" address="0x000027A4" value="0x0000FE00" />
+        <register type="OA" address="0x000027A8" value="0x00000C32" />
+        <register type="OA" address="0x000027AC" value="0x0000FE00" />
+        <register type="OA" address="0x0000274C" value="0x87643210" />
+        <register type="OA" address="0x00002744" value="0x00001811" />
+        <register type="OA" address="0x00002748" value="0x87654310" />
+    </register_config>
+  </set>
+
+  <set name="Compute Metrics L3 Cache Gen11"
+       mdapi_supported_apis="VK OGL OCL IO BB"
+       underscore_name="compute_l3_cache"
+       hw_config_guid="498aa71d-ae5c-4523-a246-33fb2769a386"
+       chipset="LKF"
+       symbol_name="ComputeL3Cache"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 L3 Bank3 Accesses"
+             description="The total number of accesses to Slice0 L3 Bank3."
+             data_type="uint64"
+             equation="C 4 READ 2 UMUL"
+             underscore_name="l3_bank03_accesses"
+             units="messages"
+             symbol_name="L3Bank03Accesses"
+             availability="$SliceMask 1 AND"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="slice"
+             mdapi_group="L3"
+             />
+    <counter name="Slice0 L3 Bank0 Accesses"
+             description="The total number of accesses to Slice0 L3 Bank0."
+             data_type="uint64"
+             equation="C 7 READ 2 UMUL"
+             underscore_name="l3_bank00_accesses"
+             units="messages"
+             symbol_name="L3Bank00Accesses"
+             availability="$SliceMask 1 AND"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="slice"
+             mdapi_group="L3"
+             />
+    <counter name="Slice0 L3 Bank1 Accesses"
+             description="The total number of accesses to Slice0 L3 Bank1."
+             data_type="uint64"
+             equation="C 6 READ 2 UMUL"
+             underscore_name="l3_bank01_accesses"
+             units="messages"
+             symbol_name="L3Bank01Accesses"
+             availability="$SliceMask 1 AND"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="slice"
+             mdapi_group="L3"
+             />
+    <counter name="Slice0 L3 Bank2 Accesses"
+             description="The total number of accesses to Slice0 L3 Bank2."
+             data_type="uint64"
+             equation="C 5 READ 2 UMUL"
+             underscore_name="l3_bank02_accesses"
+             units="messages"
+             symbol_name="L3Bank02Accesses"
+             availability="$SliceMask 1 AND"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="slice"
+             mdapi_group="L3"
+             />
+    <counter name="Slice0 L3 Bank4 Accesses"
+             description="The total number of accesses to Slice0 L3 Bank4."
+             data_type="uint64"
+             equation="C 3 READ 2 UMUL"
+             underscore_name="l3_bank04_accesses"
+             units="messages"
+             symbol_name="L3Bank04Accesses"
+             availability="$SliceMask 1 AND"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="slice"
+             mdapi_group="L3"
+             />
+    <counter name="Slice0 L3 Bank5 Accesses"
+             description="The total number of accesses to Slice0 L3 Bank5."
+             data_type="uint64"
+             equation="C 2 READ 2 UMUL"
+             underscore_name="l3_bank05_accesses"
+             units="messages"
+             symbol_name="L3Bank05Accesses"
+             availability="$SliceMask 1 AND"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="slice"
+             mdapi_group="L3"
+             />
+    <counter name="Slice0 L3 Bank6 Accesses"
+             description="The total number of accesses to Slice0 L3 Bank6."
+             data_type="uint64"
+             equation="C 1 READ 2 UMUL"
+             underscore_name="l3_bank06_accesses"
+             units="messages"
+             symbol_name="L3Bank06Accesses"
+             availability="$SliceMask 1 AND"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="slice"
+             mdapi_group="L3"
+             />
+    <counter name="Slice0 L3 Bank7 Accesses"
+             description="The total number of accesses to Slice0 L3 Bank7."
+             data_type="uint64"
+             equation="C 0 READ 2 UMUL"
+             underscore_name="l3_bank07_accesses"
+             units="messages"
+             symbol_name="L3Bank07Accesses"
+             availability="$SliceMask 1 AND"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="slice"
+             mdapi_group="L3"
+             />
+    <counter name="L3 Accesses"
+             description="The total number of L3 accesses from all entities."
+             data_type="uint64"
+             equation="$L3Bank00Accesses $L3Bank01Accesses UADD $L3Bank02Accesses UADD $L3Bank03Accesses UADD $L3Bank04Accesses UADD $L3Bank05Accesses UADD $L3Bank06Accesses UADD $L3Bank07Accesses UADD"
+             underscore_name="l3_accesses"
+             units="messages"
+             symbol_name="L3Accesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Sampler Throughput"
+             description="The total number of GPU memory bytes transferred between samplers and L3 caches."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="64  B 7 READ B 6 READ UADD 2 UMUL UMUL"
+             underscore_name="l3_sampler_throughput"
+             units="bytes"
+             symbol_name="L3SamplerThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Sampler"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU AVG IPC Rate"
+             description="The average rate of IPC calculated for 2 FPU pipelines."
+             data_type="float"
+             max_equation="2"
+             equation="A 9 READ A 10 READ A 11 READ FADD A 9 READ FSUB FDIV 1 FADD"
+             underscore_name="eu_avg_ipc_rate"
+             units="number"
+             symbol_name="EuAvgIpcRate"
+             semantic_type="ratio"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU0 Binary Instruction"
+             description="The percentage of time in which execution units were actively processing binary instructions on FPU0."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_binary_fpu0_instruction"
+             units="percent"
+             symbol_name="EuBinaryFpu0Instruction"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes/Instructions"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="EU FPU0 Hybrid Instruction"
+             description="The percentage of time in which execution units were actively processing hybrid instructions on FPU0."
+             data_type="float"
+             max_equation="100"
+             equation="A 13 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_hybrid_fpu0_instruction"
+             units="percent"
+             symbol_name="EuHybridFpu0Instruction"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="EU Array/Pipes/Instructions"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="fpu1_active"
+             units="percent"
+             symbol_name="Fpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="fpu0_active"
+             units="percent"
+             symbol_name="Fpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="L3 Misses"
+             description="The total number of L3 misses."
+             data_type="uint64"
+             equation="2 B 5 READ B 4 READ UADD UMUL"
+             underscore_name="l3_misses"
+             units="messages"
+             symbol_name="L3Misses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/TAG"
+             />
+    <counter name="EU FPU0 Move Instruction"
+             description="The percentage of time in which execution units were actively processing move instructions on FPU0."
+             data_type="float"
+             max_equation="100"
+             equation="A 19 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_move_fpu0_instruction"
+             units="percent"
+             symbol_name="EuMoveFpu0Instruction"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes/Instructions"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Accesses"
+             description="The total number of messages sent to samplers."
+             data_type="uint64"
+             equation="A 28 READ"
+             underscore_name="sampler_accesses"
+             units="messages"
+             symbol_name="SamplerAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="$SamplerAccesses 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU FPU1 Hybrid Instruction"
+             description="The percentage of time in which execution units were actively processing hybrid instructions on FPU1."
+             data_type="float"
+             max_equation="100"
+             equation="A 14 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_hybrid_fpu1_instruction"
+             units="percent"
+             symbol_name="EuHybridFpu1Instruction"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="EU Array/Pipes/Instructions"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texel lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="L3 Lookup Accesses w/o IC"
+             description="The total number of L3 cache lookup accesses w/o IC."
+             data_type="uint64"
+             equation="B 7 READ B 6 READ UADD 2 UMUL A 32 READ UADD"
+             underscore_name="l3_lookups"
+             units="messages"
+             symbol_name="L3Lookups"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/TAG"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GTI Read Throughput"
+             description="The total number of GPU memory bytes read from GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL"
+             equation="B 2 READ 64 UMUL"
+             underscore_name="gti_read_throughput"
+             units="bytes"
+             symbol_name="GtiReadThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU0 Ternary Instruction"
+             description="The percentage of time in which execution units were actively processing ternary instructions on FPU0."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_ternary_fpu0_instruction"
+             units="percent"
+             symbol_name="EuTernaryFpu0Instruction"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes/Instructions"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="GTI L3 Throughput"
+             description="The total number of GPU memory bytes transferred between L3 caches and GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL"
+             equation="$L3Misses 64 UMUL"
+             underscore_name="gti_l3_throughput"
+             units="bytes"
+             symbol_name="GtiL3Throughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU FPU1 Move Instruction"
+             description="The percentage of time in which execution units were actively processing move instructions on FPU1."
+             data_type="float"
+             max_equation="100"
+             equation="A 20 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_move_fpu1_instruction"
+             units="percent"
+             symbol_name="EuMoveFpu1Instruction"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes/Instructions"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="L3 Total Throughput"
+             description="The total number of GPU memory bytes transferred via L3."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="$L3Accesses 64 UMUL"
+             underscore_name="l3_total_throughput"
+             units="bytes"
+             symbol_name="L3TotalThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GTI Write Throughput"
+             description="The total number of GPU memory bytes written to GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL"
+             equation="B 3 READ 64 UMUL"
+             underscore_name="gti_write_throughput"
+             units="bytes"
+             symbol_name="GtiWriteThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ A 31 READ UADD A 32 READ UADD 64 UMUL"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU1 Binary Instruction"
+             description="The percentage of time in which execution units were actively processing binary instructions on FPU1."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_binary_fpu1_instruction"
+             units="percent"
+             symbol_name="EuBinaryFpu1Instruction"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes/Instructions"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU1 Ternary Instruction"
+             description="The percentage of time in which execution units were actively processing ternary instructions on FPU1."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_ternary_fpu1_instruction"
+             units="percent"
+             symbol_name="EuTernaryFpu1Instruction"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes/Instructions"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_send_active"
+             units="percent"
+             symbol_name="EuSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00000D04" value="0x00000200" />
+        <register type="NOA" address="0x00009840" value="0x00000000" />
+        <register type="NOA" address="0x00009884" value="0x00000000" />
+        <register type="NOA" address="0x00009888" value="0x14120700" />
+        <register type="NOA" address="0x00009888" value="0x121500E0" />
+        <register type="NOA" address="0x00009888" value="0x10040154" />
+        <register type="NOA" address="0x00009888" value="0x0C045000" />
+        <register type="NOA" address="0x00009888" value="0x0E040055" />
+        <register type="NOA" address="0x00009888" value="0x14050055" />
+        <register type="NOA" address="0x00009888" value="0x04054000" />
+        <register type="NOA" address="0x00009888" value="0x06055000" />
+        <register type="NOA" address="0x00009888" value="0x08055000" />
+        <register type="NOA" address="0x00009888" value="0x0A051000" />
+        <register type="NOA" address="0x00009888" value="0x260600F0" />
+        <register type="NOA" address="0x00009888" value="0x24067E00" />
+        <register type="NOA" address="0x00009888" value="0x0C120023" />
+        <register type="NOA" address="0x00009888" value="0x0E12152B" />
+        <register type="NOA" address="0x00009888" value="0x00121480" />
+        <register type="NOA" address="0x00009888" value="0x02120028" />
+        <register type="NOA" address="0x00009888" value="0x10120000" />
+        <register type="NOA" address="0x00009888" value="0x18120000" />
+        <register type="NOA" address="0x00009888" value="0x1A120000" />
+        <register type="NOA" address="0x00009888" value="0x04120000" />
+        <register type="NOA" address="0x00009888" value="0x0A13D000" />
+        <register type="NOA" address="0x00009888" value="0x04136000" />
+        <register type="NOA" address="0x00009888" value="0x0C144000" />
+        <register type="NOA" address="0x00009888" value="0x0E14C000" />
+        <register type="NOA" address="0x00009888" value="0x00148000" />
+        <register type="NOA" address="0x00009888" value="0x02144000" />
+        <register type="NOA" address="0x00009888" value="0x0C150980" />
+        <register type="NOA" address="0x00009888" value="0x02154D80" />
+        <register type="NOA" address="0x00009888" value="0x04154C9A" />
+        <register type="NOA" address="0x00009888" value="0x06150018" />
+        <register type="NOA" address="0x00009888" value="0x10150000" />
+        <register type="NOA" address="0x00009888" value="0x16150800" />
+        <register type="NOA" address="0x00009888" value="0x18150005" />
+        <register type="NOA" address="0x00009888" value="0x08150000" />
+        <register type="NOA" address="0x00009888" value="0x0A150000" />
+        <register type="NOA" address="0x00009884" value="0x00000003" />
+        <register type="NOA" address="0x00009888" value="0x0A1473A0" />
+        <register type="NOA" address="0x00009888" value="0x1217241C" />
+        <register type="NOA" address="0x00009888" value="0x2000F000" />
+        <register type="NOA" address="0x00009888" value="0x1C134000" />
+        <register type="NOA" address="0x00009888" value="0x1E130015" />
+        <register type="NOA" address="0x00009888" value="0x061434A0" />
+        <register type="NOA" address="0x00009888" value="0x0E140000" />
+        <register type="NOA" address="0x00009888" value="0x0C143000" />
+        <register type="NOA" address="0x00009888" value="0x0816C000" />
+        <register type="NOA" address="0x00009888" value="0x0A16C000" />
+        <register type="NOA" address="0x00009888" value="0x081710B0" />
+        <register type="NOA" address="0x00009888" value="0x00170000" />
+        <register type="NOA" address="0x00009888" value="0x161A2000" />
+        <register type="NOA" address="0x00009888" value="0x181A1500" />
+        <register type="NOA" address="0x00009888" value="0x501F1124" />
+        <register type="NOA" address="0x00009888" value="0x521F4849" />
+        <register type="NOA" address="0x00009888" value="0x541F0024" />
+        <register type="NOA" address="0x00009888" value="0x3A1F8000" />
+        <register type="NOA" address="0x00009888" value="0x4E1F2400" />
+        <register type="NOA" address="0x00009888" value="0x461F0100" />
+        <register type="NOA" address="0x00009888" value="0x481F1101" />
+        <register type="NOA" address="0x00009888" value="0x4A1F0011" />
+        <register type="NOA" address="0x00009888" value="0x4C1F0030" />
+        <register type="NOA" address="0x00009888" value="0x141F0000" />
+        <register type="NOA" address="0x00009888" value="0x301F0000" />
+        <register type="NOA" address="0x00009888" value="0x401F0000" />
+        <register type="NOA" address="0x00009888" value="0x421F3030" />
+        <register type="NOA" address="0x00009888" value="0x441F3030" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x00800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00000003" />
+        <register type="FLEX" address="0x0000E658" value="0x00002001" />
+        <register type="FLEX" address="0x0000E758" value="0x00101100" />
+        <register type="FLEX" address="0x0000E45C" value="0x00201200" />
+        <register type="FLEX" address="0x0000E55C" value="0x00301300" />
+        <register type="FLEX" address="0x0000E65C" value="0x00401400" />
+    </register_config>
+  </set>
+
+  <set name="Render Metrics for 3D Pipeline Profile Gen11"
+       mdapi_supported_apis="VK OGL OCL IO BB"
+       underscore_name="render_pipe_profile"
+       hw_config_guid="045dbb74-1e1a-499c-9a50-bac498e34699"
+       chipset="LKF"
+       symbol_name="RenderPipeProfile"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Bottleneck"
+             low_watermark="10"
+             description="The percentage of time in which vertex shader pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="30"
+             equation="C 6 READ 100 UMUL $GpuCoreClocks FDIV"
+             max_equation="100"
+             underscore_name="vs_bottleneck"
+             units="percent"
+             symbol_name="VsBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Hi-Depth Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which early hierarchical depth test pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="15"
+             equation="B 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             max_equation="100"
+             underscore_name="hi_depth_bottleneck"
+             units="percent"
+             symbol_name="HiDepthBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which geometry shader pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="15"
+             equation="C 3 READ 100 UMUL $GpuCoreClocks FDIV"
+             max_equation="100"
+             underscore_name="gs_bottleneck"
+             units="percent"
+             symbol_name="GsBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Geometry Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="BC Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which barycentric coordinates calculation pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="15"
+             equation="B 5 READ 100 UMUL $GpuCoreClocks FDIV"
+             max_equation="100"
+             underscore_name="bc_bottleneck"
+             units="percent"
+             symbol_name="BcBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Rasterizer/Barycentric Calc"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="HS Stall"
+             description="The percentage of time in which hull shader pipeline stage was stalled."
+             data_type="float"
+             max_equation="100"
+             equation="B 4 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="hs_stall"
+             units="percent"
+             symbol_name="HsStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Correlate Draw"
+             mdapi_group="3D Pipe/Hull Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texel lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="VF Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which vertex fetch pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="15"
+             equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             max_equation="100"
+             underscore_name="vf_bottleneck"
+             units="percent"
+             symbol_name="VfBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Input Assembler"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Strip-Fans Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which strip-fans pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="10"
+             equation="C 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             max_equation="100"
+             underscore_name="sf_bottleneck"
+             units="percent"
+             symbol_name="SfBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Rasterizer/Strip-Fans"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SF Stall"
+             description="The percentage of time in which strip-fans pipeline stage was stalled."
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sf_stall"
+             units="percent"
+             symbol_name="SfStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Correlate Draw"
+             mdapi_group="3D Pipe/Rasterizer/Strip-Fans"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="HS Bottleneck"
+             low_watermark="3"
+             description="The percentage of time in which hull shader pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="9"
+             equation="C 5 READ 100 UMUL $GpuCoreClocks FDIV"
+             max_equation="100"
+             underscore_name="hs_bottleneck"
+             units="percent"
+             symbol_name="HsBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Hull Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="CL Stall"
+             description="The percentage of time in which clipper pipeline stage was stalled."
+             data_type="float"
+             max_equation="100"
+             equation="B 1 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="cl_stall"
+             units="percent"
+             symbol_name="ClStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Correlate Draw"
+             mdapi_group="3D Pipe/Clipper"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SO Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which stream output pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="15"
+             equation="C 2 READ 100 UMUL $GpuCoreClocks FDIV"
+             max_equation="100"
+             underscore_name="so_bottleneck"
+             units="percent"
+             symbol_name="SoBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Stream Output"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="DS Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which domain shader pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="15"
+             equation="C 4 READ 100 UMUL $GpuCoreClocks FDIV"
+             max_equation="100"
+             underscore_name="ds_bottleneck"
+             units="percent"
+             symbol_name="DsBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Domain Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Clipper Bottleneck"
+             low_watermark="10"
+             description="The percentage of time in which clipper pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="30"
+             equation="C 1 READ 100 UMUL $GpuCoreClocks FDIV"
+             max_equation="100"
+             underscore_name="cl_bottleneck"
+             units="percent"
+             symbol_name="ClBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Clipper"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Stall"
+             description="The percentage of time in which domain shader pipeline stage was stalled."
+             data_type="float"
+             max_equation="100"
+             equation="B 3 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ds_stall"
+             units="percent"
+             symbol_name="DsStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Correlate Draw"
+             mdapi_group="3D Pipe/Domain Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Early Depth Bottleneck"
+             low_watermark="10"
+             description="The percentage of time in which early depth test pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="30"
+             equation="B 6 READ 100 UMUL $GpuCoreClocks FDIV"
+             max_equation="100"
+             underscore_name="early_depth_bottleneck"
+             units="percent"
+             symbol_name="EarlyDepthBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ A 31 READ UADD A 32 READ UADD 64 UMUL"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SO Stall"
+             description="The percentage of time in which stream-output pipeline stage was stalled."
+             data_type="float"
+             max_equation="100"
+             equation="B 2 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="so_stall"
+             units="percent"
+             symbol_name="SoStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Correlate Draw"
+             mdapi_group="3D Pipe/Stream Output"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00000D04" value="0x00000200" />
+        <register type="NOA" address="0x00009840" value="0x00000000" />
+        <register type="NOA" address="0x00009884" value="0x00000000" />
+        <register type="NOA" address="0x00009888" value="0x101E001E" />
+        <register type="NOA" address="0x00009888" value="0x10160000" />
+        <register type="NOA" address="0x00009888" value="0x1017001F" />
+        <register type="NOA" address="0x00009888" value="0x0A1E0500" />
+        <register type="NOA" address="0x00009888" value="0x1E1E0000" />
+        <register type="NOA" address="0x00009888" value="0x1A200100" />
+        <register type="NOA" address="0x00009888" value="0x10040015" />
+        <register type="NOA" address="0x00009888" value="0x0E054000" />
+        <register type="NOA" address="0x00009888" value="0x14050005" />
+        <register type="NOA" address="0x00009888" value="0x26060038" />
+        <register type="NOA" address="0x00009888" value="0x16157E00" />
+        <register type="NOA" address="0x00009888" value="0x0C160022" />
+        <register type="NOA" address="0x00009888" value="0x08160000" />
+        <register type="NOA" address="0x00009888" value="0x0C170540" />
+        <register type="NOA" address="0x00009888" value="0x04170000" />
+        <register type="NOA" address="0x00009888" value="0x0A188000" />
+        <register type="NOA" address="0x00009888" value="0x0C181000" />
+        <register type="NOA" address="0x00009888" value="0x12195000" />
+        <register type="NOA" address="0x00009888" value="0x14190001" />
+        <register type="NOA" address="0x00009884" value="0x00000003" />
+        <register type="NOA" address="0x00009888" value="0x100A0019" />
+        <register type="NOA" address="0x00009888" value="0x140A001F" />
+        <register type="NOA" address="0x00009888" value="0x180B0000" />
+        <register type="NOA" address="0x00009888" value="0x160C0000" />
+        <register type="NOA" address="0x00009888" value="0x1C020000" />
+        <register type="NOA" address="0x00009888" value="0x1806801F" />
+        <register type="NOA" address="0x00009888" value="0x1007001E" />
+        <register type="NOA" address="0x00009888" value="0x12080000" />
+        <register type="NOA" address="0x00009888" value="0x0A0A0047" />
+        <register type="NOA" address="0x00009888" value="0x020A0002" />
+        <register type="NOA" address="0x00009888" value="0x040A0043" />
+        <register type="NOA" address="0x00009888" value="0x200A0000" />
+        <register type="NOA" address="0x00009888" value="0x1E0A0000" />
+        <register type="NOA" address="0x00009888" value="0x180A0000" />
+        <register type="NOA" address="0x00009888" value="0x1A0A8000" />
+        <register type="NOA" address="0x00009888" value="0x080B3100" />
+        <register type="NOA" address="0x00009888" value="0x020B3200" />
+        <register type="NOA" address="0x00009888" value="0x100B0000" />
+        <register type="NOA" address="0x00009888" value="0x040C2900" />
+        <register type="NOA" address="0x00009888" value="0x000C0000" />
+        <register type="NOA" address="0x00009888" value="0x100200B1" />
+        <register type="NOA" address="0x00009888" value="0x020200B3" />
+        <register type="NOA" address="0x00009888" value="0x08020000" />
+        <register type="NOA" address="0x00009888" value="0x00020000" />
+        <register type="NOA" address="0x00009888" value="0x00034000" />
+        <register type="NOA" address="0x00009888" value="0x08038000" />
+        <register type="NOA" address="0x00009888" value="0x0E034000" />
+        <register type="NOA" address="0x00009888" value="0x02038000" />
+        <register type="NOA" address="0x00009888" value="0x1C04FFB6" />
+        <register type="NOA" address="0x00009888" value="0x1E04E039" />
+        <register type="NOA" address="0x00009888" value="0x0C059000" />
+        <register type="NOA" address="0x00009888" value="0x10050042" />
+        <register type="NOA" address="0x00009888" value="0x06060095" />
+        <register type="NOA" address="0x00009888" value="0x1E060084" />
+        <register type="NOA" address="0x00009888" value="0x1C068000" />
+        <register type="NOA" address="0x00009888" value="0x14068000" />
+        <register type="NOA" address="0x00009888" value="0x1A068000" />
+        <register type="NOA" address="0x00009888" value="0x00070022" />
+        <register type="NOA" address="0x00009888" value="0x0E070023" />
+        <register type="NOA" address="0x00009888" value="0x08078000" />
+        <register type="NOA" address="0x00009888" value="0x02078000" />
+        <register type="NOA" address="0x00009888" value="0x06080100" />
+        <register type="NOA" address="0x00009888" value="0x0E080300" />
+        <register type="NOA" address="0x00009888" value="0x1C080004" />
+        <register type="NOA" address="0x00009888" value="0x1A082000" />
+        <register type="NOA" address="0x00009888" value="0x14088000" />
+        <register type="NOA" address="0x00009888" value="0x18088000" />
+        <register type="NOA" address="0x00009888" value="0x1C090800" />
+        <register type="NOA" address="0x00009888" value="0x16098000" />
+        <register type="NOA" address="0x00009888" value="0x301F6000" />
+        <register type="NOA" address="0x00009888" value="0x501F36DB" />
+        <register type="NOA" address="0x00009888" value="0x521F491B" />
+        <register type="NOA" address="0x00009888" value="0x541F001B" />
+        <register type="NOA" address="0x00009888" value="0x3A1F6000" />
+        <register type="NOA" address="0x00009888" value="0x4E1F1B41" />
+        <register type="NOA" address="0x00009888" value="0x3E1F3100" />
+        <register type="NOA" address="0x00009888" value="0x461F5141" />
+        <register type="NOA" address="0x00009888" value="0x481F3111" />
+        <register type="NOA" address="0x00009888" value="0x4A1F1000" />
+        <register type="NOA" address="0x00009888" value="0x4C1F3120" />
+        <register type="NOA" address="0x00009888" value="0x141F0000" />
+        <register type="NOA" address="0x00009888" value="0x401F3151" />
+        <register type="NOA" address="0x00009888" value="0x421F3111" />
+        <register type="NOA" address="0x00009888" value="0x441F5121" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x00800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+    </register_config>
+  </set>
+
+  <set name="Metric set HDCAndSF"
+       mdapi_supported_apis="VK OGL OCL IO BB"
+       underscore_name="hdc_and_sf"
+       hw_config_guid="63af815c-30f9-4dd5-81fa-351ad6b69b4b"
+       chipset="LKF"
+       symbol_name="HDCAndSF"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SQ is full"
+             description="The percentage of time when SQ is filled above a threshold (usually 48 entries)"
+             data_type="float"
+             max_equation="100"
+             equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gt_request_queue_full"
+             units="percent"
+             symbol_name="GTRequestQueueFull"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on the both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="Polygon Data Ready"
+             description="The percentage of time in which geometry pipeline output is ready"
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="poly_data_ready"
+             units="percent"
+             symbol_name="PolyDataReady"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/3D Pipe/Strip-Fans"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="Slice0 Dualsubslice1 Non-sampler Shader Access Stalled On L3"
+             description="Percentage of time when HDC has messages to L3, but it's stalled due to lack of credits (Slice0 Dualsubslice1)"
+             data_type="float"
+             max_equation="100"
+             equation="C 2 READ C 1 READ FSUB 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="non_sampler_shader01_access_stalled_on_l3"
+             units="percent"
+             symbol_name="NonSamplerShader01AccessStalledOnL3"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="GPU/Data Port"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="Slice0 Dualsubslice2 Non-sampler Shader Access Stalled On L3"
+             description="Percentage of time when HDC has messages to L3, but it's stalled due to lack of credits (Slice0 Dualsubslice2)"
+             data_type="float"
+             max_equation="100"
+             equation="C 4 READ C 3 READ FSUB 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="non_sampler_shader02_access_stalled_on_l3"
+             units="percent"
+             symbol_name="NonSamplerShader02AccessStalledOnL3"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="GPU/Data Port"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ A 31 READ UADD A 32 READ UADD 64 UMUL"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="Slice0 Dualsubslice0 Non-sampler Shader Access Stalled On L3"
+             description="Percentage of time when HDC has messages to L3, but it's stalled due to lack of credits (Slice0 Dualsubslice0)"
+             data_type="float"
+             max_equation="100"
+             equation="C 0 READ B 7 READ FSUB 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="non_sampler_shader00_access_stalled_on_l3"
+             units="percent"
+             symbol_name="NonSamplerShader00AccessStalledOnL3"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="GPU/Data Port"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 Dualsubslice3 Non-sampler Shader Access Stalled On L3"
+             description="Percentage of time when HDC has messages to L3, but it's stalled due to lack of credits (Slice0 Dualsubslice3)"
+             data_type="float"
+             max_equation="100"
+             equation="C 6 READ C 5 READ FSUB 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="non_sampler_shader03_access_stalled_on_l3"
+             units="percent"
+             symbol_name="NonSamplerShader03AccessStalledOnL3"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="GPU/Data Port"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00000D04" value="0x00000200" />
+        <register type="NOA" address="0x00009840" value="0x00000000" />
+        <register type="NOA" address="0x00009884" value="0x00000000" />
+        <register type="NOA" address="0x00009888" value="0x1223000A" />
+        <register type="NOA" address="0x00009888" value="0x10230009" />
+        <register type="NOA" address="0x00009888" value="0x1263000A" />
+        <register type="NOA" address="0x00009888" value="0x10630009" />
+        <register type="NOA" address="0x00009888" value="0x12A3000A" />
+        <register type="NOA" address="0x00009888" value="0x10A30009" />
+        <register type="NOA" address="0x00009888" value="0x12E3000A" />
+        <register type="NOA" address="0x00009888" value="0x10E30009" />
+        <register type="NOA" address="0x00009888" value="0x10150019" />
+        <register type="NOA" address="0x00009888" value="0x1A20A000" />
+        <register type="NOA" address="0x00009888" value="0x0C231900" />
+        <register type="NOA" address="0x00009888" value="0x0E23003C" />
+        <register type="NOA" address="0x00009888" value="0x00230000" />
+        <register type="NOA" address="0x00009888" value="0x1C600002" />
+        <register type="NOA" address="0x00009888" value="0x02608000" />
+        <register type="NOA" address="0x00009888" value="0x0E631900" />
+        <register type="NOA" address="0x00009888" value="0x00631E00" />
+        <register type="NOA" address="0x00009888" value="0x04A08000" />
+        <register type="NOA" address="0x00009888" value="0x06A08000" />
+        <register type="NOA" address="0x00009888" value="0x02A31E32" />
+        <register type="NOA" address="0x00009888" value="0x00A30000" />
+        <register type="NOA" address="0x00009888" value="0x08E08000" />
+        <register type="NOA" address="0x00009888" value="0x0AE08000" />
+        <register type="NOA" address="0x00009888" value="0x04E31E32" />
+        <register type="NOA" address="0x00009888" value="0x00E30000" />
+        <register type="NOA" address="0x00009888" value="0x0C045400" />
+        <register type="NOA" address="0x00009888" value="0x10040150" />
+        <register type="NOA" address="0x00009888" value="0x0E040015" />
+        <register type="NOA" address="0x00009888" value="0x04055000" />
+        <register type="NOA" address="0x00009888" value="0x14050054" />
+        <register type="NOA" address="0x00009888" value="0x06055000" />
+        <register type="NOA" address="0x00009888" value="0x08055000" />
+        <register type="NOA" address="0x00009888" value="0x24063F00" />
+        <register type="NOA" address="0x00009888" value="0x260600E0" />
+        <register type="NOA" address="0x00009888" value="0x0E088000" />
+        <register type="NOA" address="0x00009888" value="0x00088000" />
+        <register type="NOA" address="0x00009888" value="0x14090040" />
+        <register type="NOA" address="0x00009888" value="0x04094000" />
+        <register type="NOA" address="0x00009888" value="0x040DA000" />
+        <register type="NOA" address="0x00009888" value="0x080E5000" />
+        <register type="NOA" address="0x00009888" value="0x1A120020" />
+        <register type="NOA" address="0x00009888" value="0x02128000" />
+        <register type="NOA" address="0x00009888" value="0x0412C000" />
+        <register type="NOA" address="0x00009888" value="0x0612C000" />
+        <register type="NOA" address="0x00009888" value="0x0A138000" />
+        <register type="NOA" address="0x00009888" value="0x0413E000" />
+        <register type="NOA" address="0x00009888" value="0x0E148000" />
+        <register type="NOA" address="0x00009888" value="0x00148000" />
+        <register type="NOA" address="0x00009888" value="0x0214C000" />
+        <register type="NOA" address="0x00009888" value="0x00150047" />
+        <register type="NOA" address="0x00009888" value="0x16156000" />
+        <register type="NOA" address="0x00009888" value="0x18150007" />
+        <register type="NOA" address="0x00009888" value="0x02154000" />
+        <register type="NOA" address="0x00009888" value="0x04154000" />
+        <register type="NOA" address="0x00009888" value="0x06154000" />
+        <register type="NOA" address="0x00009888" value="0x08158000" />
+        <register type="NOA" address="0x00009888" value="0x0A158000" />
+        <register type="NOA" address="0x00009888" value="0x0C188000" />
+        <register type="NOA" address="0x00009888" value="0x0E182000" />
+        <register type="NOA" address="0x00009888" value="0x1419000A" />
+        <register type="NOA" address="0x00009888" value="0x021CA000" />
+        <register type="NOA" address="0x00009888" value="0x0A1DA000" />
+        <register type="NOA" address="0x00009884" value="0x00000003" />
+        <register type="NOA" address="0x00009888" value="0x1C1F3061" />
+        <register type="NOA" address="0x00009888" value="0x141F0000" />
+        <register type="NOA" address="0x00009888" value="0x301F8000" />
+        <register type="NOA" address="0x00009888" value="0x521F4000" />
+        <register type="NOA" address="0x00009888" value="0x541F0024" />
+        <register type="NOA" address="0x00009888" value="0x3A1F8000" />
+        <register type="NOA" address="0x00009888" value="0x4E1F2400" />
+        <register type="NOA" address="0x00009888" value="0x501F0024" />
+        <register type="NOA" address="0x00009888" value="0x3E1F0100" />
+        <register type="NOA" address="0x00009888" value="0x4C1F3030" />
+        <register type="NOA" address="0x00009888" value="0x401F0000" />
+        <register type="NOA" address="0x00009888" value="0x421F3000" />
+        <register type="NOA" address="0x00009888" value="0x441F3330" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x10800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+        <register type="OA" address="0x00002770" value="0x00000002" />
+        <register type="OA" address="0x00002774" value="0x0000FFFE" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+    </register_config>
+  </set>
+
+  <set name="Metric set RasterizerAndPixelBackend"
+       mdapi_supported_apis="VK OGL OCL IO BB"
+       underscore_name="rasterizer_and_pixel_backend"
+       hw_config_guid="20df0e83-535f-457f-a08b-76aee88c1e0e"
+       chipset="LKF"
+       symbol_name="RasterizerAndPixelBackend"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SQ is full"
+             description="The percentage of time when SQ is filled above a threshold (usually 48 entries)"
+             data_type="float"
+             max_equation="100"
+             equation="C 6 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gt_request_queue_full"
+             units="percent"
+             symbol_name="GTRequestQueueFull"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 Pipe0 PS Output Available"
+             description="The percentage of time in which slice0 pipe0 PS output is available"
+             data_type="float"
+             max_equation="100"
+             equation="C 4 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_output00_available"
+             units="percent"
+             symbol_name="PSOutput00Available"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/3D Pipe"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Slice0 Pipe1 PS Output Available"
+             description="The percentage of time in which slice0 pipe1 PS output is available"
+             data_type="float"
+             max_equation="100"
+             equation="C 5 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_output01_available"
+             units="percent"
+             symbol_name="PSOutput01Available"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/3D Pipe"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on the both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Slice0 Pipe1 Pixel Values Ready"
+             description="The percentage of time in which slice0 pipe1 pixel values are ready"
+             data_type="float"
+             max_equation="100"
+             equation="C 3 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="pixel_values01_ready"
+             units="percent"
+             symbol_name="PixelValues01Ready"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/3D Pipe"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Slice0 Pipe0 Post-EarlyZ Pixel Data Ready"
+             description="The percentage of time in which slice0  pipe0 post-EarlyZ pixel data is ready (after early Z tests have been applied)"
+             data_type="float"
+             max_equation="100"
+             equation="B 1 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="pixel_data00_ready"
+             units="percent"
+             symbol_name="PixelData00Ready"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Rasterizer/Early Depth Test"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="Slice0 Pipe1 Post-EarlyZ Pixel Data Ready"
+             description="The percentage of time in which slice0  pipe1 post-EarlyZ pixel data is ready (after early Z tests have been applied)"
+             data_type="float"
+             max_equation="100"
+             equation="B 2 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="pixel_data01_ready"
+             units="percent"
+             symbol_name="PixelData01Ready"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Rasterizer/Early Depth Test"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="Slice0 Rasterizer Input Available"
+             description="The percentage of time in which slice0 rasterizer input is available"
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="rasterizer0_input_available"
+             units="percent"
+             symbol_name="Rasterizer0InputAvailable"
+             availability="$SliceMask 1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Rasterizer"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="Slice0 Pipe0 Pixel Values Ready"
+             description="The percentage of time in which slice0 pipe0 pixel values are ready"
+             data_type="float"
+             max_equation="100"
+             equation="C 2 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="pixel_values00_ready"
+             units="percent"
+             symbol_name="PixelValues00Ready"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/3D Pipe"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 Rasterizer Output Ready"
+             description="The percentage of time in which slice0 rasterizer output is ready"
+             data_type="float"
+             max_equation="100"
+             equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="rasterizer0_output_ready"
+             units="percent"
+             symbol_name="Rasterizer0OutputReady"
+             availability="$SliceMask 1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Rasterizer"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ A 31 READ UADD A 32 READ UADD 64 UMUL"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00000D04" value="0x00000200" />
+        <register type="NOA" address="0x00009840" value="0x00000000" />
+        <register type="NOA" address="0x00009884" value="0x00000000" />
+        <register type="NOA" address="0x00009888" value="0x120A03E0" />
+        <register type="NOA" address="0x00009888" value="0x140C0500" />
+        <register type="NOA" address="0x00009888" value="0x120F03E0" />
+        <register type="NOA" address="0x00009888" value="0x14110500" />
+        <register type="NOA" address="0x00009888" value="0x10136000" />
+        <register type="NOA" address="0x00009888" value="0x1213001C" />
+        <register type="NOA" address="0x00009888" value="0x16140000" />
+        <register type="NOA" address="0x00009888" value="0x10160018" />
+        <register type="NOA" address="0x00009888" value="0x101A0018" />
+        <register type="NOA" address="0x00009888" value="0x0C045400" />
+        <register type="NOA" address="0x00009888" value="0x0E045545" />
+        <register type="NOA" address="0x00009888" value="0x04055000" />
+        <register type="NOA" address="0x00009888" value="0x0A055000" />
+        <register type="NOA" address="0x00009888" value="0x0C055000" />
+        <register type="NOA" address="0x00009888" value="0x0E051000" />
+        <register type="NOA" address="0x00009888" value="0x06055000" />
+        <register type="NOA" address="0x00009888" value="0x08051000" />
+        <register type="NOA" address="0x00009888" value="0x2406DF00" />
+        <register type="NOA" address="0x00009888" value="0x26060007" />
+        <register type="NOA" address="0x00009888" value="0x02084000" />
+        <register type="NOA" address="0x00009888" value="0x04098000" />
+        <register type="NOA" address="0x00009888" value="0x06094000" />
+        <register type="NOA" address="0x00009888" value="0x000A0C40" />
+        <register type="NOA" address="0x00009888" value="0x0C0A0000" />
+        <register type="NOA" address="0x00009888" value="0x040A0000" />
+        <register type="NOA" address="0x00009888" value="0x020C0B80" />
+        <register type="NOA" address="0x00009888" value="0x080C0000" />
+        <register type="NOA" address="0x00009888" value="0x040D1000" />
+        <register type="NOA" address="0x00009888" value="0x060E2000" />
+        <register type="NOA" address="0x00009888" value="0x080E1000" />
+        <register type="NOA" address="0x00009888" value="0x020F0031" />
+        <register type="NOA" address="0x00009888" value="0x0C0F0000" />
+        <register type="NOA" address="0x00009888" value="0x040F0000" />
+        <register type="NOA" address="0x00009888" value="0x04110017" />
+        <register type="NOA" address="0x00009888" value="0x08110000" />
+        <register type="NOA" address="0x00009888" value="0x18120C00" />
+        <register type="NOA" address="0x00009888" value="0x02128000" />
+        <register type="NOA" address="0x00009888" value="0x06128000" />
+        <register type="NOA" address="0x00009888" value="0x0613092F" />
+        <register type="NOA" address="0x00009888" value="0x08134025" />
+        <register type="NOA" address="0x00009888" value="0x0C130000" />
+        <register type="NOA" address="0x00009888" value="0x0413A000" />
+        <register type="NOA" address="0x00009888" value="0x00148066" />
+        <register type="NOA" address="0x00009888" value="0x10140000" />
+        <register type="NOA" address="0x00009888" value="0x0614C000" />
+        <register type="NOA" address="0x00009888" value="0x08144000" />
+        <register type="NOA" address="0x00009888" value="0x0A144000" />
+        <register type="NOA" address="0x00009888" value="0x02148000" />
+        <register type="NOA" address="0x00009888" value="0x00154000" />
+        <register type="NOA" address="0x00009888" value="0x0E154000" />
+        <register type="NOA" address="0x00009888" value="0x161500E8" />
+        <register type="NOA" address="0x00009888" value="0x02154000" />
+        <register type="NOA" address="0x00009888" value="0x04158000" />
+        <register type="NOA" address="0x00009888" value="0x06154000" />
+        <register type="NOA" address="0x00009888" value="0x08158000" />
+        <register type="NOA" address="0x00009888" value="0x0C154000" />
+        <register type="NOA" address="0x00009888" value="0x08161000" />
+        <register type="NOA" address="0x00009888" value="0x08184000" />
+        <register type="NOA" address="0x00009888" value="0x12190100" />
+        <register type="NOA" address="0x00009888" value="0x0A1A0020" />
+        <register type="NOA" address="0x00009888" value="0x081A0000" />
+        <register type="NOA" address="0x00009888" value="0x0A1C1000" />
+        <register type="NOA" address="0x00009888" value="0x121D0400" />
+        <register type="NOA" address="0x00009884" value="0x00000003" />
+        <register type="NOA" address="0x00009888" value="0x1C1F3000" />
+        <register type="NOA" address="0x00009888" value="0x1A1F0061" />
+        <register type="NOA" address="0x00009888" value="0x141F0000" />
+        <register type="NOA" address="0x00009888" value="0x301F8000" />
+        <register type="NOA" address="0x00009888" value="0x501F4904" />
+        <register type="NOA" address="0x00009888" value="0x521F0024" />
+        <register type="NOA" address="0x00009888" value="0x3A1F8000" />
+        <register type="NOA" address="0x00009888" value="0x4E1F2400" />
+        <register type="NOA" address="0x00009888" value="0x3E1F5000" />
+        <register type="NOA" address="0x00009888" value="0x461F4040" />
+        <register type="NOA" address="0x00009888" value="0x481F0030" />
+        <register type="NOA" address="0x00009888" value="0x401F4010" />
+        <register type="NOA" address="0x00009888" value="0x421F3000" />
+        <register type="NOA" address="0x00009888" value="0x441F4023" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x70800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+        <register type="OA" address="0x00002770" value="0x00000038" />
+        <register type="OA" address="0x00002774" value="0x0000FFF8" />
+        <register type="OA" address="0x00002778" value="0x00000002" />
+        <register type="OA" address="0x0000277C" value="0x0000FFF7" />
+        <register type="OA" address="0x00002780" value="0x00000002" />
+        <register type="OA" address="0x00002784" value="0x0000FFEF" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+    </register_config>
+  </set>
+
+  <set name="Metric set L3_1"
+       mdapi_supported_apis="VK OGL OCL IO BB"
+       underscore_name="l3_1"
+       hw_config_guid="c7d3dc5c-975d-4d3a-a4c8-86fb0085743b"
+       chipset="LKF"
+       symbol_name="L3_1"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 L3 Bank1 Active"
+             description="The percentage of time in which slice0 L3 bank1 is active"
+             data_type="float"
+             max_equation="100"
+             equation="C 1 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l30_bank1_active"
+             units="percent"
+             symbol_name="L30Bank1Active"
+             availability="$SliceMask 1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SQ is full"
+             description="The percentage of time when SQ is filled above a threshold (usually 48 entries)"
+             data_type="float"
+             max_equation="100"
+             equation="B 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gt_request_queue_full"
+             units="percent"
+             symbol_name="GTRequestQueueFull"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on the both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Slice0 L3 Bank5 Active"
+             description="The percentage of time in which slice0 L3 bank5 is active"
+             data_type="float"
+             max_equation="100"
+             equation="C 5 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l30_bank5_active"
+             units="percent"
+             symbol_name="L30Bank5Active"
+             availability="$SliceMask 1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 L3 Bank3 Active"
+             description="The percentage of time in which slice0 L3 bank3 is active"
+             data_type="float"
+             max_equation="100"
+             equation="C 3 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l30_bank3_active"
+             units="percent"
+             symbol_name="L30Bank3Active"
+             availability="$SliceMask 1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 L3 Bank6 Active"
+             description="The percentage of time in which slice0 L3 bank6 is active"
+             data_type="float"
+             max_equation="100"
+             equation="C 6 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l30_bank6_active"
+             units="percent"
+             symbol_name="L30Bank6Active"
+             availability="$SliceMask 1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Slice0 L3 Bank2 Active"
+             description="The percentage of time in which slice0 L3 bank2 is active"
+             data_type="float"
+             max_equation="100"
+             equation="C 2 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l30_bank2_active"
+             units="percent"
+             symbol_name="L30Bank2Active"
+             availability="$SliceMask 1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Slice0 L3 Bank0 Active"
+             description="The percentage of time in which slice0 L3 bank0 is active"
+             data_type="float"
+             max_equation="100"
+             equation="C 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l30_bank0_active"
+             units="percent"
+             symbol_name="L30Bank0Active"
+             availability="$SliceMask 1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Slice0 L3 Bank7 Active"
+             description="The percentage of time in which slice0 L3 bank7 is active"
+             data_type="float"
+             max_equation="100"
+             equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l30_bank7_active"
+             units="percent"
+             symbol_name="L30Bank7Active"
+             availability="$SliceMask 1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Slice0 L3 Bank4 Active"
+             description="The percentage of time in which slice0 L3 bank4 is active"
+             data_type="float"
+             max_equation="100"
+             equation="C 4 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l30_bank4_active"
+             units="percent"
+             symbol_name="L30Bank4Active"
+             availability="$SliceMask 1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ A 31 READ UADD A 32 READ UADD 64 UMUL"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00000D04" value="0x00000200" />
+        <register type="NOA" address="0x00009840" value="0x00000000" />
+        <register type="NOA" address="0x00009884" value="0x00000000" />
+        <register type="NOA" address="0x00009888" value="0x17340000" />
+        <register type="NOA" address="0x00009888" value="0x17740000" />
+        <register type="NOA" address="0x00009888" value="0x17B40000" />
+        <register type="NOA" address="0x00009888" value="0x17F40000" />
+        <register type="NOA" address="0x00009888" value="0x16340000" />
+        <register type="NOA" address="0x00009888" value="0x16740000" />
+        <register type="NOA" address="0x00009888" value="0x16B40000" />
+        <register type="NOA" address="0x00009888" value="0x16F40000" />
+        <register type="NOA" address="0x00009888" value="0x07340017" />
+        <register type="NOA" address="0x00009888" value="0x27340000" />
+        <register type="NOA" address="0x00009888" value="0x09740017" />
+        <register type="NOA" address="0x00009888" value="0x27740000" />
+        <register type="NOA" address="0x00009888" value="0x0BB40017" />
+        <register type="NOA" address="0x00009888" value="0x27B40000" />
+        <register type="NOA" address="0x00009888" value="0x0DF40017" />
+        <register type="NOA" address="0x00009888" value="0x27F40000" />
+        <register type="NOA" address="0x00009888" value="0x0E0000A7" />
+        <register type="NOA" address="0x00009888" value="0x08012000" />
+        <register type="NOA" address="0x00009888" value="0x0A034000" />
+        <register type="NOA" address="0x00009888" value="0x0C038000" />
+        <register type="NOA" address="0x00009888" value="0x1C340017" />
+        <register type="NOA" address="0x00009888" value="0x26340000" />
+        <register type="NOA" address="0x00009888" value="0x1E740017" />
+        <register type="NOA" address="0x00009888" value="0x26740000" />
+        <register type="NOA" address="0x00009888" value="0x02B40017" />
+        <register type="NOA" address="0x00009888" value="0x26B40000" />
+        <register type="NOA" address="0x00009888" value="0x04F40017" />
+        <register type="NOA" address="0x00009888" value="0x26F40000" />
+        <register type="NOA" address="0x00009888" value="0x10040200" />
+        <register type="NOA" address="0x00009888" value="0x0E040055" />
+        <register type="NOA" address="0x00009888" value="0x14050070" />
+        <register type="NOA" address="0x00009888" value="0x04058000" />
+        <register type="NOA" address="0x00009888" value="0x06056000" />
+        <register type="NOA" address="0x00009888" value="0x08055000" />
+        <register type="NOA" address="0x00009888" value="0x0A051000" />
+        <register type="NOA" address="0x00009888" value="0x260600C0" />
+        <register type="NOA" address="0x00009888" value="0x24067E00" />
+        <register type="NOA" address="0x00009888" value="0x02074000" />
+        <register type="NOA" address="0x00009888" value="0x04078000" />
+        <register type="NOA" address="0x00009888" value="0x06124000" />
+        <register type="NOA" address="0x00009888" value="0x08124000" />
+        <register type="NOA" address="0x00009888" value="0x0A124000" />
+        <register type="NOA" address="0x00009888" value="0x0C124000" />
+        <register type="NOA" address="0x00009888" value="0x04138000" />
+        <register type="NOA" address="0x00009888" value="0x06137000" />
+        <register type="NOA" address="0x00009888" value="0x02148000" />
+        <register type="NOA" address="0x00009888" value="0x0414C000" />
+        <register type="NOA" address="0x00009888" value="0x06144000" />
+        <register type="NOA" address="0x00009888" value="0x06154000" />
+        <register type="NOA" address="0x00009888" value="0x08154000" />
+        <register type="NOA" address="0x00009888" value="0x0A154000" />
+        <register type="NOA" address="0x00009888" value="0x0C154000" />
+        <register type="NOA" address="0x00009884" value="0x00000003" />
+        <register type="NOA" address="0x00009888" value="0x1C1F3000" />
+        <register type="NOA" address="0x00009888" value="0x2A1F0061" />
+        <register type="NOA" address="0x00009888" value="0x141F0000" />
+        <register type="NOA" address="0x00009888" value="0x521F0000" />
+        <register type="NOA" address="0x00009888" value="0x541F0024" />
+        <register type="NOA" address="0x00009888" value="0x3A1F8000" />
+        <register type="NOA" address="0x00009888" value="0x4E1F2460" />
+        <register type="NOA" address="0x00009888" value="0x501F0124" />
+        <register type="NOA" address="0x00009888" value="0x4C1F0133" />
+        <register type="NOA" address="0x00009888" value="0x301F0000" />
+        <register type="NOA" address="0x00009888" value="0x401F6060" />
+        <register type="NOA" address="0x00009888" value="0x421F0010" />
+        <register type="NOA" address="0x00009888" value="0x441F0000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x00800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+    </register_config>
+  </set>
+
+  <set name="Gen11 L2Bank0 stalled metric set"
+       mdapi_supported_apis="VK OGL OGL4 OCL MEDIA IO BB"
+       underscore_name="l3_2"
+       hw_config_guid="04003388-30ef-45d6-ae89-86f71ee596f4"
+       chipset="LKF"
+       symbol_name="L3_2"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 13 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on the both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 14 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 L3 Bank0 Stalled"
+             description="The percentage of time in which slice0 L3 bank0 is stalled"
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ B 1 READ FADD B 2 READ FADD B 3 READ FADD 4 FDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l30_bank0_stalled"
+             units="percent"
+             symbol_name="L30Bank0Stalled"
+             availability="$SliceMask 1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="EU Thread Occupancy"
+             description="The percentage of time in which hardware threads occupied EUs."
+             data_type="float"
+             max_equation="100"
+             equation="8 A 10 READ FMUL $EuThreadsCount FDIV $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_thread_occupancy"
+             units="percent"
+             symbol_name="EuThreadOccupancy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00000D04" value="0x00000200" />
+        <register type="NOA" address="0x00009840" value="0x00000000" />
+        <register type="NOA" address="0x00009884" value="0x00000000" />
+        <register type="NOA" address="0x00009888" value="0x10050C00" />
+        <register type="NOA" address="0x00009888" value="0x12050002" />
+        <register type="NOA" address="0x00009888" value="0x00050025" />
+        <register type="NOA" address="0x00009888" value="0x06050900" />
+        <register type="NOA" address="0x00009888" value="0x080508EA" />
+        <register type="NOA" address="0x00009888" value="0x0A0508AB" />
+        <register type="NOA" address="0x00009888" value="0x0C050A21" />
+        <register type="NOA" address="0x00009888" value="0x0E050A60" />
+        <register type="NOA" address="0x00009888" value="0x04050000" />
+        <register type="NOA" address="0x00009888" value="0x14050000" />
+        <register type="NOA" address="0x00009888" value="0x24068100" />
+        <register type="NOA" address="0x00009888" value="0x260600FF" />
+        <register type="NOA" address="0x00009884" value="0x00000003" />
+        <register type="NOA" address="0x00009888" value="0x301F8000" />
+        <register type="NOA" address="0x00009888" value="0x501F4800" />
+        <register type="NOA" address="0x00009888" value="0x521F4924" />
+        <register type="NOA" address="0x00009888" value="0x541F0024" />
+        <register type="NOA" address="0x00009888" value="0x3E1F0000" />
+        <register type="NOA" address="0x00009888" value="0x461F0000" />
+        <register type="NOA" address="0x00009888" value="0x481F0000" />
+        <register type="NOA" address="0x00009888" value="0x4A1F0000" />
+        <register type="NOA" address="0x00009888" value="0x4C1F0000" />
+        <register type="NOA" address="0x00009888" value="0x141F0000" />
+        <register type="NOA" address="0x00009888" value="0x4E1F0000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+        <register type="OA" address="0x00002770" value="0x00000022" />
+        <register type="OA" address="0x00002774" value="0x0000FFF8" />
+        <register type="OA" address="0x00002778" value="0x00000082" />
+        <register type="OA" address="0x0000277C" value="0x0000FFE7" />
+        <register type="OA" address="0x00002780" value="0x00000402" />
+        <register type="OA" address="0x00002784" value="0x0000FF1F" />
+        <register type="OA" address="0x00002788" value="0x00001002" />
+        <register type="OA" address="0x0000278C" value="0x0000FCFF" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00008003" />
+        <register type="FLEX" address="0x0000E658" value="0x00011010" />
+        <register type="FLEX" address="0x0000E758" value="0x00050012" />
+        <register type="FLEX" address="0x0000E45C" value="0x00052051" />
+        <register type="FLEX" address="0x0000E55C" value="0x00000053" />
+    </register_config>
+  </set>
+
+  <set name="Gen11 L2Bank1 stalled metric set"
+       mdapi_supported_apis="VK OGL OGL4 OCL MEDIA IO BB"
+       underscore_name="l3_3"
+       hw_config_guid="12f706a4-3761-4448-83dc-63495da010ff"
+       chipset="LKF"
+       symbol_name="L3_3"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 13 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on the both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="Slice0 L3 Bank1 Stalled"
+             description="The percentage of time in which slice0 L3 bank1 is stalled"
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ B 1 READ FADD B 2 READ FADD B 3 READ FADD 4 FDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l30_bank1_stalled"
+             units="percent"
+             symbol_name="L30Bank1Stalled"
+             availability="$SliceMask 1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 14 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="EU Thread Occupancy"
+             description="The percentage of time in which hardware threads occupied EUs."
+             data_type="float"
+             max_equation="100"
+             equation="8 A 10 READ FMUL $EuThreadsCount FDIV $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_thread_occupancy"
+             units="percent"
+             symbol_name="EuThreadOccupancy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00000D04" value="0x00000200" />
+        <register type="NOA" address="0x00009840" value="0x00000000" />
+        <register type="NOA" address="0x00009884" value="0x00000000" />
+        <register type="NOA" address="0x00009888" value="0x10050400" />
+        <register type="NOA" address="0x00009888" value="0x12050000" />
+        <register type="NOA" address="0x00009888" value="0x00050025" />
+        <register type="NOA" address="0x00009888" value="0x06050900" />
+        <register type="NOA" address="0x00009888" value="0x080508EA" />
+        <register type="NOA" address="0x00009888" value="0x0A0508AB" />
+        <register type="NOA" address="0x00009888" value="0x0C050A21" />
+        <register type="NOA" address="0x00009888" value="0x0E050A60" />
+        <register type="NOA" address="0x00009888" value="0x04050000" />
+        <register type="NOA" address="0x00009888" value="0x14050000" />
+        <register type="NOA" address="0x00009888" value="0x24068100" />
+        <register type="NOA" address="0x00009888" value="0x260600FF" />
+        <register type="NOA" address="0x00009884" value="0x00000003" />
+        <register type="NOA" address="0x00009888" value="0x301F8000" />
+        <register type="NOA" address="0x00009888" value="0x501F4800" />
+        <register type="NOA" address="0x00009888" value="0x521F4924" />
+        <register type="NOA" address="0x00009888" value="0x541F0024" />
+        <register type="NOA" address="0x00009888" value="0x3E1F0000" />
+        <register type="NOA" address="0x00009888" value="0x461F0000" />
+        <register type="NOA" address="0x00009888" value="0x481F0000" />
+        <register type="NOA" address="0x00009888" value="0x4A1F0000" />
+        <register type="NOA" address="0x00009888" value="0x4C1F0000" />
+        <register type="NOA" address="0x00009888" value="0x141F0000" />
+        <register type="NOA" address="0x00009888" value="0x4E1F0000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+        <register type="OA" address="0x00002770" value="0x00000022" />
+        <register type="OA" address="0x00002774" value="0x0000FFF8" />
+        <register type="OA" address="0x00002778" value="0x00000082" />
+        <register type="OA" address="0x0000277C" value="0x0000FFE7" />
+        <register type="OA" address="0x00002780" value="0x00000402" />
+        <register type="OA" address="0x00002784" value="0x0000FF1F" />
+        <register type="OA" address="0x00002788" value="0x00001002" />
+        <register type="OA" address="0x0000278C" value="0x0000FCFF" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00008003" />
+        <register type="FLEX" address="0x0000E658" value="0x00011010" />
+        <register type="FLEX" address="0x0000E758" value="0x00050012" />
+        <register type="FLEX" address="0x0000E45C" value="0x00052051" />
+        <register type="FLEX" address="0x0000E55C" value="0x00000053" />
+    </register_config>
+  </set>
+
+  <set name="Gen11 L2Bank4 stalled metric set"
+       mdapi_supported_apis="VK OGL OGL4 OCL MEDIA IO BB"
+       underscore_name="l3_4"
+       hw_config_guid="b03ae6f7-fdc0-4879-9e65-5b221ac9625f"
+       chipset="LKF"
+       symbol_name="L3_4"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 13 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on the both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 14 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Slice0 L3 Bank4 Stalled"
+             description="The percentage of time in which slice0 L3 bank4 is stalled"
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ B 1 READ FADD B 2 READ FADD B 3 READ FADD 4 FDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l30_bank4_stalled"
+             units="percent"
+             symbol_name="L30Bank4Stalled"
+             availability="$SliceMask 1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="EU Thread Occupancy"
+             description="The percentage of time in which hardware threads occupied EUs."
+             data_type="float"
+             max_equation="100"
+             equation="8 A 10 READ FMUL $EuThreadsCount FDIV $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_thread_occupancy"
+             units="percent"
+             symbol_name="EuThreadOccupancy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00000D04" value="0x00000200" />
+        <register type="NOA" address="0x00009840" value="0x00000000" />
+        <register type="NOA" address="0x00009884" value="0x00000000" />
+        <register type="NOA" address="0x00009888" value="0x10010C00" />
+        <register type="NOA" address="0x00009888" value="0x12010002" />
+        <register type="NOA" address="0x00009888" value="0x0C000400" />
+        <register type="NOA" address="0x00009888" value="0x0E005500" />
+        <register type="NOA" address="0x00009888" value="0x10000155" />
+        <register type="NOA" address="0x00009888" value="0x00010025" />
+        <register type="NOA" address="0x00009888" value="0x06010900" />
+        <register type="NOA" address="0x00009888" value="0x080108EA" />
+        <register type="NOA" address="0x00009888" value="0x0A0108AB" />
+        <register type="NOA" address="0x00009888" value="0x0C010A21" />
+        <register type="NOA" address="0x00009888" value="0x0E010A60" />
+        <register type="NOA" address="0x00009888" value="0x04010000" />
+        <register type="NOA" address="0x00009888" value="0x14010000" />
+        <register type="NOA" address="0x00009888" value="0x0C040400" />
+        <register type="NOA" address="0x00009888" value="0x0E045500" />
+        <register type="NOA" address="0x00009888" value="0x10040155" />
+        <register type="NOA" address="0x00009888" value="0x04051000" />
+        <register type="NOA" address="0x00009888" value="0x0A054000" />
+        <register type="NOA" address="0x00009888" value="0x0C055000" />
+        <register type="NOA" address="0x00009888" value="0x0E055000" />
+        <register type="NOA" address="0x00009888" value="0x14050055" />
+        <register type="NOA" address="0x00009888" value="0x24068100" />
+        <register type="NOA" address="0x00009888" value="0x260600FF" />
+        <register type="NOA" address="0x00009888" value="0x00124000" />
+        <register type="NOA" address="0x00009888" value="0x0E124000" />
+        <register type="NOA" address="0x00009888" value="0x18125540" />
+        <register type="NOA" address="0x00009888" value="0x1A120015" />
+        <register type="NOA" address="0x00009888" value="0x04131000" />
+        <register type="NOA" address="0x00009888" value="0x06138000" />
+        <register type="NOA" address="0x00009888" value="0x0813F000" />
+        <register type="NOA" address="0x00009888" value="0x0A13F000" />
+        <register type="NOA" address="0x00009888" value="0x00144000" />
+        <register type="NOA" address="0x00009888" value="0x06148000" />
+        <register type="NOA" address="0x00009888" value="0x0814C000" />
+        <register type="NOA" address="0x00009888" value="0x0A14C000" />
+        <register type="NOA" address="0x00009888" value="0x0C14C000" />
+        <register type="NOA" address="0x00009888" value="0x0E14C000" />
+        <register type="NOA" address="0x00009888" value="0x00154000" />
+        <register type="NOA" address="0x00009888" value="0x0E154000" />
+        <register type="NOA" address="0x00009888" value="0x16152AA8" />
+        <register type="NOA" address="0x00009888" value="0x18150005" />
+        <register type="NOA" address="0x00009884" value="0x00000003" />
+        <register type="NOA" address="0x00009888" value="0x301F8000" />
+        <register type="NOA" address="0x00009888" value="0x501F4800" />
+        <register type="NOA" address="0x00009888" value="0x521F4924" />
+        <register type="NOA" address="0x00009888" value="0x541F0024" />
+        <register type="NOA" address="0x00009888" value="0x3E1F0000" />
+        <register type="NOA" address="0x00009888" value="0x461F0000" />
+        <register type="NOA" address="0x00009888" value="0x481F0000" />
+        <register type="NOA" address="0x00009888" value="0x4A1F0000" />
+        <register type="NOA" address="0x00009888" value="0x4C1F0000" />
+        <register type="NOA" address="0x00009888" value="0x141F0000" />
+        <register type="NOA" address="0x00009888" value="0x4E1F0000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+        <register type="OA" address="0x00002770" value="0x00000022" />
+        <register type="OA" address="0x00002774" value="0x0000FFF8" />
+        <register type="OA" address="0x00002778" value="0x00000082" />
+        <register type="OA" address="0x0000277C" value="0x0000FFE7" />
+        <register type="OA" address="0x00002780" value="0x00000402" />
+        <register type="OA" address="0x00002784" value="0x0000FF1F" />
+        <register type="OA" address="0x00002788" value="0x00001002" />
+        <register type="OA" address="0x0000278C" value="0x0000FCFF" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00008003" />
+        <register type="FLEX" address="0x0000E658" value="0x00011010" />
+        <register type="FLEX" address="0x0000E758" value="0x00050012" />
+        <register type="FLEX" address="0x0000E45C" value="0x00052051" />
+        <register type="FLEX" address="0x0000E55C" value="0x00000053" />
+    </register_config>
+  </set>
+
+  <set name="Gen11 L2Bank5 stalled metric set"
+       mdapi_supported_apis="VK OGL OGL4 OCL MEDIA IO BB"
+       underscore_name="l3_5"
+       hw_config_guid="cdec4315-3c8d-416f-b3ae-33f7590e1439"
+       chipset="LKF"
+       symbol_name="L3_5"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 13 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on the both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 14 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="Slice0 L3 Bank5 Stalled"
+             description="The percentage of time in which slice0 L3 bank5 is stalled"
+             data_type="float"
+             max_equation="100"
+             equation="B 2 READ B 3 READ FADD B 0 READ FADD B 1 READ FADD 4 FDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l30_bank5_stalled"
+             units="percent"
+             symbol_name="L30Bank5Stalled"
+             availability="$SliceMask 1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="EU Thread Occupancy"
+             description="The percentage of time in which hardware threads occupied EUs."
+             data_type="float"
+             max_equation="100"
+             equation="8 A 10 READ FMUL $EuThreadsCount FDIV $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_thread_occupancy"
+             units="percent"
+             symbol_name="EuThreadOccupancy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00000D04" value="0x00000200" />
+        <register type="NOA" address="0x00009840" value="0x00000000" />
+        <register type="NOA" address="0x00009884" value="0x00000000" />
+        <register type="NOA" address="0x00009888" value="0x10010400" />
+        <register type="NOA" address="0x00009888" value="0x12010000" />
+        <register type="NOA" address="0x00009888" value="0x0C000400" />
+        <register type="NOA" address="0x00009888" value="0x0E005500" />
+        <register type="NOA" address="0x00009888" value="0x10000155" />
+        <register type="NOA" address="0x00009888" value="0x00010022" />
+        <register type="NOA" address="0x00009888" value="0x06010840" />
+        <register type="NOA" address="0x00009888" value="0x08010828" />
+        <register type="NOA" address="0x00009888" value="0x0A010969" />
+        <register type="NOA" address="0x00009888" value="0x0C010AA4" />
+        <register type="NOA" address="0x00009888" value="0x0E010AE3" />
+        <register type="NOA" address="0x00009888" value="0x04010000" />
+        <register type="NOA" address="0x00009888" value="0x14010000" />
+        <register type="NOA" address="0x00009888" value="0x0C040400" />
+        <register type="NOA" address="0x00009888" value="0x0E045500" />
+        <register type="NOA" address="0x00009888" value="0x10040155" />
+        <register type="NOA" address="0x00009888" value="0x04051000" />
+        <register type="NOA" address="0x00009888" value="0x0A054000" />
+        <register type="NOA" address="0x00009888" value="0x0C055000" />
+        <register type="NOA" address="0x00009888" value="0x0E055000" />
+        <register type="NOA" address="0x00009888" value="0x14050055" />
+        <register type="NOA" address="0x00009888" value="0x24068100" />
+        <register type="NOA" address="0x00009888" value="0x260600FF" />
+        <register type="NOA" address="0x00009888" value="0x00124000" />
+        <register type="NOA" address="0x00009888" value="0x0E124000" />
+        <register type="NOA" address="0x00009888" value="0x18125540" />
+        <register type="NOA" address="0x00009888" value="0x1A120015" />
+        <register type="NOA" address="0x00009888" value="0x04131000" />
+        <register type="NOA" address="0x00009888" value="0x06138000" />
+        <register type="NOA" address="0x00009888" value="0x0813F000" />
+        <register type="NOA" address="0x00009888" value="0x0A13F000" />
+        <register type="NOA" address="0x00009888" value="0x00144000" />
+        <register type="NOA" address="0x00009888" value="0x06148000" />
+        <register type="NOA" address="0x00009888" value="0x0814C000" />
+        <register type="NOA" address="0x00009888" value="0x0A14C000" />
+        <register type="NOA" address="0x00009888" value="0x0C14C000" />
+        <register type="NOA" address="0x00009888" value="0x0E14C000" />
+        <register type="NOA" address="0x00009888" value="0x00154000" />
+        <register type="NOA" address="0x00009888" value="0x0E154000" />
+        <register type="NOA" address="0x00009888" value="0x16152AA8" />
+        <register type="NOA" address="0x00009888" value="0x18150005" />
+        <register type="NOA" address="0x00009884" value="0x00000003" />
+        <register type="NOA" address="0x00009888" value="0x301F8000" />
+        <register type="NOA" address="0x00009888" value="0x501F4800" />
+        <register type="NOA" address="0x00009888" value="0x521F4924" />
+        <register type="NOA" address="0x00009888" value="0x541F0024" />
+        <register type="NOA" address="0x00009888" value="0x3E1F0000" />
+        <register type="NOA" address="0x00009888" value="0x461F0000" />
+        <register type="NOA" address="0x00009888" value="0x481F0000" />
+        <register type="NOA" address="0x00009888" value="0x4A1F0000" />
+        <register type="NOA" address="0x00009888" value="0x4C1F0000" />
+        <register type="NOA" address="0x00009888" value="0x141F0000" />
+        <register type="NOA" address="0x00009888" value="0x4E1F0000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+        <register type="OA" address="0x00002770" value="0x00000022" />
+        <register type="OA" address="0x00002774" value="0x0000FFF8" />
+        <register type="OA" address="0x00002778" value="0x00000082" />
+        <register type="OA" address="0x0000277C" value="0x0000FFE7" />
+        <register type="OA" address="0x00002780" value="0x00000402" />
+        <register type="OA" address="0x00002784" value="0x0000FF1F" />
+        <register type="OA" address="0x00002788" value="0x00001002" />
+        <register type="OA" address="0x0000278C" value="0x0000FCFF" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00008003" />
+        <register type="FLEX" address="0x0000E658" value="0x00011010" />
+        <register type="FLEX" address="0x0000E758" value="0x00050012" />
+        <register type="FLEX" address="0x0000E45C" value="0x00052051" />
+        <register type="FLEX" address="0x0000E55C" value="0x00000053" />
+    </register_config>
+  </set>
+
+  <set name="Metric set Sampler 1"
+       mdapi_supported_apis="VK OGL OCL IO BB"
+       underscore_name="sampler_1"
+       hw_config_guid="377c06c4-5f41-465a-bf2e-60d95200ba94"
+       chipset="LKF"
+       symbol_name="Sampler_1"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 Subslice2 Input Available"
+             description="The percentage of time in which slice0 subslice2 sampler input is available"
+             data_type="float"
+             max_equation="100"
+             equation="B 5 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler02_input_available"
+             units="percent"
+             symbol_name="Sampler02InputAvailable"
+             availability="$SubsliceMask 4 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 Subslice0 Input Available"
+             description="The percentage of time in which slice0 subslice0 sampler input is available"
+             data_type="float"
+             max_equation="100"
+             equation="B 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler00_input_available"
+             units="percent"
+             symbol_name="Sampler00InputAvailable"
+             availability="$SubsliceMask 1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on the both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Slice0 Subslice1 Input Available"
+             description="The percentage of time in which slice0 subslice1 sampler input is available"
+             data_type="float"
+             max_equation="100"
+             equation="B 6 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler01_input_available"
+             units="percent"
+             symbol_name="Sampler01InputAvailable"
+             availability="$SubsliceMask 2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Slice0 Subslice6 Input Available"
+             description="The percentage of time in which slice0 subslice6 sampler input is available"
+             data_type="float"
+             max_equation="100"
+             equation="B 1 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler06_input_available"
+             units="percent"
+             symbol_name="Sampler06InputAvailable"
+             availability="$SubsliceMask 64 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 Subslice4 Input Available"
+             description="The percentage of time in which slice0 subslice4 sampler input is available"
+             data_type="float"
+             max_equation="100"
+             equation="B 3 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler04_input_available"
+             units="percent"
+             symbol_name="Sampler04InputAvailable"
+             availability="$SubsliceMask 16 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="Slice0 Subslice3 Input Available"
+             description="The percentage of time in which slice0 subslice3 sampler input is available"
+             data_type="float"
+             max_equation="100"
+             equation="B 4 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler03_input_available"
+             units="percent"
+             symbol_name="Sampler03InputAvailable"
+             availability="$SubsliceMask 8 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 Subslice5 Input Available"
+             description="The percentage of time in which slice0 subslice5 sampler input is available"
+             data_type="float"
+             max_equation="100"
+             equation="B 2 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler05_input_available"
+             units="percent"
+             symbol_name="Sampler05InputAvailable"
+             availability="$SubsliceMask 32 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Slice0 Subslice7 Input Available"
+             description="The percentage of time in which slice0 subslice7 sampler input is available"
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler07_input_available"
+             units="percent"
+             symbol_name="Sampler07InputAvailable"
+             availability="$SubsliceMask 128 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ A 31 READ UADD A 32 READ UADD 64 UMUL"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00000D04" value="0x00000200" />
+        <register type="NOA" address="0x00009840" value="0x00000000" />
+        <register type="NOA" address="0x00009884" value="0x00000000" />
+        <register type="NOA" address="0x00009888" value="0x142A0165" />
+        <register type="NOA" address="0x00009888" value="0x142F0165" />
+        <register type="NOA" address="0x00009888" value="0x146A0165" />
+        <register type="NOA" address="0x00009888" value="0x146F0165" />
+        <register type="NOA" address="0x00009888" value="0x14AA0165" />
+        <register type="NOA" address="0x00009888" value="0x14AF0165" />
+        <register type="NOA" address="0x00009888" value="0x14EA0165" />
+        <register type="NOA" address="0x00009888" value="0x14EF0165" />
+        <register type="NOA" address="0x00009888" value="0x161E8000" />
+        <register type="NOA" address="0x00009888" value="0x181E8000" />
+        <register type="NOA" address="0x00009888" value="0x1C1E1800" />
+        <register type="NOA" address="0x00009888" value="0x06204000" />
+        <register type="NOA" address="0x00009888" value="0x08204000" />
+        <register type="NOA" address="0x00009888" value="0x0A204000" />
+        <register type="NOA" address="0x00009888" value="0x0C204000" />
+        <register type="NOA" address="0x00009888" value="0x16218000" />
+        <register type="NOA" address="0x00009888" value="0x18218000" />
+        <register type="NOA" address="0x00009888" value="0x1E210018" />
+        <register type="NOA" address="0x00009888" value="0x042A1800" />
+        <register type="NOA" address="0x00009888" value="0x062AC038" />
+        <register type="NOA" address="0x00009888" value="0x102A0000" />
+        <register type="NOA" address="0x00009888" value="0x082AC000" />
+        <register type="NOA" address="0x00009888" value="0x0A2A0000" />
+        <register type="NOA" address="0x00009888" value="0x0C2A0000" />
+        <register type="NOA" address="0x00009888" value="0x062C4000" />
+        <register type="NOA" address="0x00009888" value="0x082C4000" />
+        <register type="NOA" address="0x00009888" value="0x0A2C4000" />
+        <register type="NOA" address="0x00009888" value="0x0C2C4000" />
+        <register type="NOA" address="0x00009888" value="0x022F2000" />
+        <register type="NOA" address="0x00009888" value="0x042F0048" />
+        <register type="NOA" address="0x00009888" value="0x102F0000" />
+        <register type="NOA" address="0x00009888" value="0x062F0000" />
+        <register type="NOA" address="0x00009888" value="0x082F0000" />
+        <register type="NOA" address="0x00009888" value="0x1E5E0030" />
+        <register type="NOA" address="0x00009888" value="0x125E8000" />
+        <register type="NOA" address="0x00009888" value="0x145E8000" />
+        <register type="NOA" address="0x00009888" value="0x1A604000" />
+        <register type="NOA" address="0x00009888" value="0x1C600001" />
+        <register type="NOA" address="0x00009888" value="0x02604000" />
+        <register type="NOA" address="0x00009888" value="0x04604000" />
+        <register type="NOA" address="0x00009888" value="0x1E613000" />
+        <register type="NOA" address="0x00009888" value="0x12618000" />
+        <register type="NOA" address="0x00009888" value="0x14618000" />
+        <register type="NOA" address="0x00009888" value="0x006A1800" />
+        <register type="NOA" address="0x00009888" value="0x026A0038" />
+        <register type="NOA" address="0x00009888" value="0x106A0000" />
+        <register type="NOA" address="0x00009888" value="0x1A6A00F0" />
+        <register type="NOA" address="0x00009888" value="0x046A0000" />
+        <register type="NOA" address="0x00009888" value="0x186C5000" />
+        <register type="NOA" address="0x00009888" value="0x026C4000" />
+        <register type="NOA" address="0x00009888" value="0x046C4000" />
+        <register type="NOA" address="0x00009888" value="0x0E6F2440" />
+        <register type="NOA" address="0x00009888" value="0x106F0000" />
+        <register type="NOA" address="0x00009888" value="0x1A6F0000" />
+        <register type="NOA" address="0x00009888" value="0x1E9E000F" />
+        <register type="NOA" address="0x00009888" value="0x1AA01540" />
+        <register type="NOA" address="0x00009888" value="0x1EA10F00" />
+        <register type="NOA" address="0x00009888" value="0x0CAA1C30" />
+        <register type="NOA" address="0x00009888" value="0x10AA0000" />
+        <register type="NOA" address="0x00009888" value="0x18AAF000" />
+        <register type="NOA" address="0x00009888" value="0x1AAA0000" />
+        <register type="NOA" address="0x00009888" value="0x18AC0550" />
+        <register type="NOA" address="0x00009888" value="0x0AAF2440" />
+        <register type="NOA" address="0x00009888" value="0x10AF0000" />
+        <register type="NOA" address="0x00009888" value="0x1AAF0000" />
+        <register type="NOA" address="0x00009888" value="0x10DE8000" />
+        <register type="NOA" address="0x00009888" value="0x1CDEE000" />
+        <register type="NOA" address="0x00009888" value="0x00E04000" />
+        <register type="NOA" address="0x00009888" value="0x0EE04000" />
+        <register type="NOA" address="0x00009888" value="0x18E04000" />
+        <register type="NOA" address="0x00009888" value="0x1AE00010" />
+        <register type="NOA" address="0x00009888" value="0x10E18000" />
+        <register type="NOA" address="0x00009888" value="0x1EE100E0" />
+        <register type="NOA" address="0x00009888" value="0x08EA1C30" />
+        <register type="NOA" address="0x00009888" value="0x10EA0000" />
+        <register type="NOA" address="0x00009888" value="0x00EAC000" />
+        <register type="NOA" address="0x00009888" value="0x0EEAC000" />
+        <register type="NOA" address="0x00009888" value="0x18EA0000" />
+        <register type="NOA" address="0x00009888" value="0x00EC4000" />
+        <register type="NOA" address="0x00009888" value="0x0EEC4000" />
+        <register type="NOA" address="0x00009888" value="0x18EC0005" />
+        <register type="NOA" address="0x00009888" value="0x00EF0040" />
+        <register type="NOA" address="0x00009888" value="0x06EF2400" />
+        <register type="NOA" address="0x00009888" value="0x10EF0000" />
+        <register type="NOA" address="0x00009888" value="0x0EEF0000" />
+        <register type="NOA" address="0x00009888" value="0x0C045400" />
+        <register type="NOA" address="0x00009888" value="0x0E045555" />
+        <register type="NOA" address="0x00009888" value="0x10040155" />
+        <register type="NOA" address="0x00009888" value="0x04055000" />
+        <register type="NOA" address="0x00009888" value="0x0A055000" />
+        <register type="NOA" address="0x00009888" value="0x0C055000" />
+        <register type="NOA" address="0x00009888" value="0x0E055000" />
+        <register type="NOA" address="0x00009888" value="0x14050055" />
+        <register type="NOA" address="0x00009888" value="0x06055000" />
+        <register type="NOA" address="0x00009888" value="0x08055000" />
+        <register type="NOA" address="0x00009888" value="0x2406FF00" />
+        <register type="NOA" address="0x00009888" value="0x260600FF" />
+        <register type="NOA" address="0x00009888" value="0x0E08A000" />
+        <register type="NOA" address="0x00009888" value="0x00088000" />
+        <register type="NOA" address="0x00009888" value="0x02082000" />
+        <register type="NOA" address="0x00009888" value="0x14090050" />
+        <register type="NOA" address="0x00009888" value="0x04094000" />
+        <register type="NOA" address="0x00009888" value="0x06091000" />
+        <register type="NOA" address="0x00009888" value="0x000D2000" />
+        <register type="NOA" address="0x00009888" value="0x060D8000" />
+        <register type="NOA" address="0x00009888" value="0x080DA000" />
+        <register type="NOA" address="0x00009888" value="0x040E1000" />
+        <register type="NOA" address="0x00009888" value="0x0A0E4000" />
+        <register type="NOA" address="0x00009888" value="0x0C0E5000" />
+        <register type="NOA" address="0x00009888" value="0x1812FC00" />
+        <register type="NOA" address="0x00009888" value="0x1A12002B" />
+        <register type="NOA" address="0x00009888" value="0x02128000" />
+        <register type="NOA" address="0x00009888" value="0x04128000" />
+        <register type="NOA" address="0x00009888" value="0x0813C000" />
+        <register type="NOA" address="0x00009888" value="0x0A13F000" />
+        <register type="NOA" address="0x00009888" value="0x04136000" />
+        <register type="NOA" address="0x00009888" value="0x0A14C000" />
+        <register type="NOA" address="0x00009888" value="0x0C14C000" />
+        <register type="NOA" address="0x00009888" value="0x0E14C000" />
+        <register type="NOA" address="0x00009888" value="0x00148000" />
+        <register type="NOA" address="0x00009888" value="0x02144000" />
+        <register type="NOA" address="0x00009888" value="0x00158000" />
+        <register type="NOA" address="0x00009888" value="0x0E158000" />
+        <register type="NOA" address="0x00009888" value="0x16152AD0" />
+        <register type="NOA" address="0x00009888" value="0x18150005" />
+        <register type="NOA" address="0x00009888" value="0x02154000" />
+        <register type="NOA" address="0x00009888" value="0x04154000" />
+        <register type="NOA" address="0x00009888" value="0x0615C000" />
+        <register type="NOA" address="0x00009888" value="0x0815C000" />
+        <register type="NOA" address="0x00009888" value="0x0A15C000" />
+        <register type="NOA" address="0x00009888" value="0x0C15C000" />
+        <register type="NOA" address="0x00009888" value="0x02188000" />
+        <register type="NOA" address="0x00009888" value="0x0418A000" />
+        <register type="NOA" address="0x00009888" value="0x06182000" />
+        <register type="NOA" address="0x00009888" value="0x0A198000" />
+        <register type="NOA" address="0x00009888" value="0x0C19A000" />
+        <register type="NOA" address="0x00009888" value="0x0E192000" />
+        <register type="NOA" address="0x00009888" value="0x0A1CA000" />
+        <register type="NOA" address="0x00009888" value="0x0C1CA000" />
+        <register type="NOA" address="0x00009888" value="0x121D5400" />
+        <register type="NOA" address="0x00009888" value="0x141D0002" />
+        <register type="NOA" address="0x00009884" value="0x00000003" />
+        <register type="NOA" address="0x00009888" value="0x301F8000" />
+        <register type="NOA" address="0x00009888" value="0x501F4924" />
+        <register type="NOA" address="0x00009888" value="0x521F4924" />
+        <register type="NOA" address="0x00009888" value="0x541F0024" />
+        <register type="NOA" address="0x00009888" value="0x3A1F8000" />
+        <register type="NOA" address="0x00009888" value="0x4E1F2400" />
+        <register type="NOA" address="0x00009888" value="0x3E1F3000" />
+        <register type="NOA" address="0x00009888" value="0x461F4030" />
+        <register type="NOA" address="0x00009888" value="0x481F0040" />
+        <register type="NOA" address="0x00009888" value="0x4A1F1000" />
+        <register type="NOA" address="0x00009888" value="0x4C1F0010" />
+        <register type="NOA" address="0x00009888" value="0x141F0000" />
+        <register type="NOA" address="0x00009888" value="0x401F1010" />
+        <register type="NOA" address="0x00009888" value="0x421F3030" />
+        <register type="NOA" address="0x00009888" value="0x441F4040" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0xF0800000" />
+        <register type="OA" address="0x00002770" value="0x00000018" />
+        <register type="OA" address="0x00002774" value="0x0000FFFC" />
+        <register type="OA" address="0x00002778" value="0x00000060" />
+        <register type="OA" address="0x0000277C" value="0x0000FFF3" />
+        <register type="OA" address="0x00002780" value="0x00000180" />
+        <register type="OA" address="0x00002784" value="0x0000FFCF" />
+        <register type="OA" address="0x00002788" value="0x00000600" />
+        <register type="OA" address="0x0000278C" value="0x0000FF3F" />
+        <register type="OA" address="0x00002790" value="0x00001800" />
+        <register type="OA" address="0x00002794" value="0x0000FCFF" />
+        <register type="OA" address="0x00002798" value="0x00006000" />
+        <register type="OA" address="0x0000279C" value="0x0000F3FF" />
+        <register type="OA" address="0x000027A0" value="0x00018000" />
+        <register type="OA" address="0x000027A4" value="0x0000CFFF" />
+        <register type="OA" address="0x000027A8" value="0x00060000" />
+        <register type="OA" address="0x000027AC" value="0x00003FFF" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+    </register_config>
+  </set>
+
+  <set name="Metric set Sampler 2"
+       mdapi_supported_apis="VK OGL OCL IO BB"
+       underscore_name="sampler_2"
+       hw_config_guid="58326100-b3e7-4554-b612-592e16dc6fd1"
+       chipset="LKF"
+       symbol_name="Sampler_2"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SQ is full"
+             description="The percentage of time when SQ is filled above a threshold (usually 48 entries)"
+             data_type="float"
+             max_equation="100"
+             equation="B 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gt_request_queue_full"
+             units="percent"
+             symbol_name="GTRequestQueueFull"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on the both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="Slice0 Subslice2 Sampler Output Ready"
+             description="The percentage of time in which slice0 subslice2 sampler output is ready"
+             data_type="float"
+             max_equation="100"
+             equation="C 2 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler02_output_ready"
+             units="percent"
+             symbol_name="Sampler02OutputReady"
+             availability="$SubsliceMask 4 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Slice0 Subslice6 Sampler Output Ready"
+             description="The percentage of time in which slice0 subslice6 sampler output is ready"
+             data_type="float"
+             max_equation="100"
+             equation="C 6 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler06_output_ready"
+             units="percent"
+             symbol_name="Sampler06OutputReady"
+             availability="$SubsliceMask 64 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Slice0 Subslice4 Sampler Output Ready"
+             description="The percentage of time in which slice0 subslice4 sampler output is ready"
+             data_type="float"
+             max_equation="100"
+             equation="C 4 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler04_output_ready"
+             units="percent"
+             symbol_name="Sampler04OutputReady"
+             availability="$SubsliceMask 16 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Slice0 Subslice3 Sampler Output Ready"
+             description="The percentage of time in which slice0 subslice3 sampler output is ready"
+             data_type="float"
+             max_equation="100"
+             equation="C 3 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler03_output_ready"
+             units="percent"
+             symbol_name="Sampler03OutputReady"
+             availability="$SubsliceMask 8 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 Subslice7 Sampler Output Ready"
+             description="The percentage of time in which slice0 subslice7 sampler output is ready"
+             data_type="float"
+             max_equation="100"
+             equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler07_output_ready"
+             units="percent"
+             symbol_name="Sampler07OutputReady"
+             availability="$SubsliceMask 128 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="Slice0 Subslice5 Sampler Output Ready"
+             description="The percentage of time in which slice0 subslice5 sampler output is ready"
+             data_type="float"
+             max_equation="100"
+             equation="C 5 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler05_output_ready"
+             units="percent"
+             symbol_name="Sampler05OutputReady"
+             availability="$SubsliceMask 32 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Slice0 Subslice0 Sampler Output Ready"
+             description="The percentage of time in which slice0 subslice0 sampler output is ready"
+             data_type="float"
+             max_equation="100"
+             equation="C 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler00_output_ready"
+             units="percent"
+             symbol_name="Sampler00OutputReady"
+             availability="$SubsliceMask 1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Slice0 Subslice1 Sampler Output Ready"
+             description="The percentage of time in which slice0 subslice1 sampler output is ready"
+             data_type="float"
+             max_equation="100"
+             equation="C 1 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler01_output_ready"
+             units="percent"
+             symbol_name="Sampler01OutputReady"
+             availability="$SubsliceMask 2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ A 31 READ UADD A 32 READ UADD 64 UMUL"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00000D04" value="0x00000200" />
+        <register type="NOA" address="0x00009840" value="0x00000000" />
+        <register type="NOA" address="0x00009884" value="0x00000000" />
+        <register type="NOA" address="0x00009888" value="0x142D0005" />
+        <register type="NOA" address="0x00009888" value="0x14320005" />
+        <register type="NOA" address="0x00009888" value="0x146D0005" />
+        <register type="NOA" address="0x00009888" value="0x14720005" />
+        <register type="NOA" address="0x00009888" value="0x14AD0005" />
+        <register type="NOA" address="0x00009888" value="0x14B20005" />
+        <register type="NOA" address="0x00009888" value="0x14ED0005" />
+        <register type="NOA" address="0x00009888" value="0x14F20005" />
+        <register type="NOA" address="0x00009888" value="0x1E1E0030" />
+        <register type="NOA" address="0x00009888" value="0x1A204000" />
+        <register type="NOA" address="0x00009888" value="0x1C200001" />
+        <register type="NOA" address="0x00009888" value="0x1E213000" />
+        <register type="NOA" address="0x00009888" value="0x1A2A00C0" />
+        <register type="NOA" address="0x00009888" value="0x182C6000" />
+        <register type="NOA" address="0x00009888" value="0x0E2D0033" />
+        <register type="NOA" address="0x00009888" value="0x022D0000" />
+        <register type="NOA" address="0x00009888" value="0x1A2F8000" />
+        <register type="NOA" address="0x00009888" value="0x1C300008" />
+        <register type="NOA" address="0x00009888" value="0x0E318000" />
+        <register type="NOA" address="0x00009888" value="0x0E321980" />
+        <register type="NOA" address="0x00009888" value="0x02320000" />
+        <register type="NOA" address="0x00009888" value="0x125E8000" />
+        <register type="NOA" address="0x00009888" value="0x145E8000" />
+        <register type="NOA" address="0x00009888" value="0x02604000" />
+        <register type="NOA" address="0x00009888" value="0x04604000" />
+        <register type="NOA" address="0x00009888" value="0x12618000" />
+        <register type="NOA" address="0x00009888" value="0x14618000" />
+        <register type="NOA" address="0x00009888" value="0x046AC000" />
+        <register type="NOA" address="0x00009888" value="0x026C8000" />
+        <register type="NOA" address="0x00009888" value="0x046C4000" />
+        <register type="NOA" address="0x00009888" value="0x006D1980" />
+        <register type="NOA" address="0x00009888" value="0x026D0000" />
+        <register type="NOA" address="0x00009888" value="0x046F8000" />
+        <register type="NOA" address="0x00009888" value="0x14708000" />
+        <register type="NOA" address="0x00009888" value="0x02714000" />
+        <register type="NOA" address="0x00009888" value="0x02720033" />
+        <register type="NOA" address="0x00009888" value="0x169E8000" />
+        <register type="NOA" address="0x00009888" value="0x189E8000" />
+        <register type="NOA" address="0x00009888" value="0x06A04000" />
+        <register type="NOA" address="0x00009888" value="0x08A04000" />
+        <register type="NOA" address="0x00009888" value="0x16A18000" />
+        <register type="NOA" address="0x00009888" value="0x18A18000" />
+        <register type="NOA" address="0x00009888" value="0x08AAC000" />
+        <register type="NOA" address="0x00009888" value="0x06AC8000" />
+        <register type="NOA" address="0x00009888" value="0x08AC4000" />
+        <register type="NOA" address="0x00009888" value="0x02AD1980" />
+        <register type="NOA" address="0x00009888" value="0x08AF8000" />
+        <register type="NOA" address="0x00009888" value="0x18B04000" />
+        <register type="NOA" address="0x00009888" value="0x04B14000" />
+        <register type="NOA" address="0x00009888" value="0x04B20033" />
+        <register type="NOA" address="0x00009888" value="0x02B20000" />
+        <register type="NOA" address="0x00009888" value="0x1CDE1800" />
+        <register type="NOA" address="0x00009888" value="0x0AE04000" />
+        <register type="NOA" address="0x00009888" value="0x0CE04000" />
+        <register type="NOA" address="0x00009888" value="0x1EE10018" />
+        <register type="NOA" address="0x00009888" value="0x0CEAC000" />
+        <register type="NOA" address="0x00009888" value="0x0AEC8000" />
+        <register type="NOA" address="0x00009888" value="0x0CEC4000" />
+        <register type="NOA" address="0x00009888" value="0x04ED1980" />
+        <register type="NOA" address="0x00009888" value="0x02ED0000" />
+        <register type="NOA" address="0x00009888" value="0x0CEF8000" />
+        <register type="NOA" address="0x00009888" value="0x1AF00400" />
+        <register type="NOA" address="0x00009888" value="0x06F14000" />
+        <register type="NOA" address="0x00009888" value="0x06F20033" />
+        <register type="NOA" address="0x00009888" value="0x02F20000" />
+        <register type="NOA" address="0x00009888" value="0x10040140" />
+        <register type="NOA" address="0x00009888" value="0x0C045000" />
+        <register type="NOA" address="0x00009888" value="0x0E040055" />
+        <register type="NOA" address="0x00009888" value="0x14050050" />
+        <register type="NOA" address="0x00009888" value="0x04054000" />
+        <register type="NOA" address="0x00009888" value="0x06055000" />
+        <register type="NOA" address="0x00009888" value="0x08055000" />
+        <register type="NOA" address="0x00009888" value="0x0A051000" />
+        <register type="NOA" address="0x00009888" value="0x260600C0" />
+        <register type="NOA" address="0x00009888" value="0x24067E00" />
+        <register type="NOA" address="0x00009888" value="0x00088000" />
+        <register type="NOA" address="0x00009888" value="0x02082000" />
+        <register type="NOA" address="0x00009888" value="0x04094000" />
+        <register type="NOA" address="0x00009888" value="0x06091000" />
+        <register type="NOA" address="0x00009888" value="0x040D8000" />
+        <register type="NOA" address="0x00009888" value="0x060D2000" />
+        <register type="NOA" address="0x00009888" value="0x080E4000" />
+        <register type="NOA" address="0x00009888" value="0x0A0E1000" />
+        <register type="NOA" address="0x00009888" value="0x02128000" />
+        <register type="NOA" address="0x00009888" value="0x04128000" />
+        <register type="NOA" address="0x00009888" value="0x0612C000" />
+        <register type="NOA" address="0x00009888" value="0x0812C000" />
+        <register type="NOA" address="0x00009888" value="0x0413E000" />
+        <register type="NOA" address="0x00009888" value="0x06131000" />
+        <register type="NOA" address="0x00009888" value="0x00148000" />
+        <register type="NOA" address="0x00009888" value="0x0214C000" />
+        <register type="NOA" address="0x00009888" value="0x04144000" />
+        <register type="NOA" address="0x00009888" value="0x1815000F" />
+        <register type="NOA" address="0x00009888" value="0x02154000" />
+        <register type="NOA" address="0x00009888" value="0x04154000" />
+        <register type="NOA" address="0x00009888" value="0x06154000" />
+        <register type="NOA" address="0x00009888" value="0x08154000" />
+        <register type="NOA" address="0x00009888" value="0x0A158000" />
+        <register type="NOA" address="0x00009888" value="0x0C158000" />
+        <register type="NOA" address="0x00009888" value="0x0E18A000" />
+        <register type="NOA" address="0x00009888" value="0x14190028" />
+        <register type="NOA" address="0x00009888" value="0x021C8000" />
+        <register type="NOA" address="0x00009888" value="0x041C2000" />
+        <register type="NOA" address="0x00009888" value="0x0A1D8000" />
+        <register type="NOA" address="0x00009888" value="0x0C1D2000" />
+        <register type="NOA" address="0x00009884" value="0x00000003" />
+        <register type="NOA" address="0x00009888" value="0x1C1F3000" />
+        <register type="NOA" address="0x00009888" value="0x2A1F0061" />
+        <register type="NOA" address="0x00009888" value="0x141F0000" />
+        <register type="NOA" address="0x00009888" value="0x521F0000" />
+        <register type="NOA" address="0x00009888" value="0x541F0024" />
+        <register type="NOA" address="0x00009888" value="0x3A1F8000" />
+        <register type="NOA" address="0x00009888" value="0x4E1F2430" />
+        <register type="NOA" address="0x00009888" value="0x501F0124" />
+        <register type="NOA" address="0x00009888" value="0x4C1F0137" />
+        <register type="NOA" address="0x00009888" value="0x301F0000" />
+        <register type="NOA" address="0x00009888" value="0x401F0040" />
+        <register type="NOA" address="0x00009888" value="0x421F0040" />
+        <register type="NOA" address="0x00009888" value="0x441F3001" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x00800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+    </register_config>
+  </set>
+
+  <set name="Metric set TDL_1"
+       mdapi_supported_apis="VK OGL OCL IO BB"
+       underscore_name="tdl_1"
+       hw_config_guid="4c71735a-dfbf-4ebe-9df3-6c3db344a466"
+       chipset="LKF"
+       symbol_name="TDL_1"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on the both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="PS Thread Ready For Dispatch on Slice0 Subslice3 Thread Dispatcher"
+             description="The percentage of time in which PS thread is ready for dispatch on slice0 subslice3 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="B 4 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_thread03_ready_for_dispatch"
+             units="percent"
+             symbol_name="PSThread03ReadyForDispatch"
+             availability="$SubsliceMask 8 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="FS AVG Stall per Thread"
+             description="The average number of cycles per hardware thread run in which fragment shaders were stalled on the EUs."
+             data_type="uint64"
+             equation="A 20 READ A 6 READ UDIV"
+             underscore_name="ps_eu_stall_per_thread"
+             units="cycles"
+             symbol_name="PsEuStallPerThread"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS AVG Stall per Thread"
+             description="The average number of cycles per hardware thread run in which vertex shaders were stalled on the EUs."
+             data_type="uint64"
+             equation="A 14 READ A 1 READ UDIV"
+             underscore_name="vs_eu_stall_per_thread"
+             units="cycles"
+             symbol_name="VsEuStallPerThread"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="FS AVG Active per Thread"
+             description="The average number of cycles per hardware thread run in which fragment shaders were processed actively on the EUs."
+             data_type="uint64"
+             equation="A 19 READ A 6 READ UDIV"
+             underscore_name="ps_eu_active_per_thread"
+             units="cycles"
+             symbol_name="PsEuActivePerThread"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="FS EU Active"
+             description="The percentage of time in which fragment shaders were processed actively on the EUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 19 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_active"
+             units="percent"
+             symbol_name="PsEuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="EU Array/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Thread Ready For Dispatch on Slice0 Subslice0 Thread Dispatcher"
+             description="The percentage of time in which PS thread is ready for dispatch on slice0 subslice0 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="B 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_thread00_ready_for_dispatch"
+             units="percent"
+             symbol_name="PSThread00ReadyForDispatch"
+             availability="$SubsliceMask 1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Thread Ready For Dispatch on Slice0 Subslice7 Thread Dispatcher"
+             description="The percentage of time in which PS thread is ready for dispatch on slice0 subslice7 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_thread07_ready_for_dispatch"
+             units="percent"
+             symbol_name="PSThread07ReadyForDispatch"
+             availability="$SubsliceMask 128 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="FS EU Stall"
+             description="The percentage of time in which fragment shaders were stalled on the EUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 20 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_stall"
+             units="percent"
+             symbol_name="PsEuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="EU Array/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Thread Ready For Dispatch on Slice0 Subslice5 Thread Dispatcher"
+             description="The percentage of time in which PS thread is ready for dispatch on slice0 subslice5 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="B 2 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_thread05_ready_for_dispatch"
+             units="percent"
+             symbol_name="PSThread05ReadyForDispatch"
+             availability="$SubsliceMask 32 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="VS EU Active"
+             description="The percentage of time in which vertex shaders were processed actively on the EUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 13 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_eu_active"
+             units="percent"
+             symbol_name="VsEuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="PS Thread Ready For Dispatch on Slice0 Subslice1 Thread Dispatcher"
+             description="The percentage of time in which PS thread is ready for dispatch on slice0 subslice1 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="B 6 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_thread01_ready_for_dispatch"
+             units="percent"
+             symbol_name="PSThread01ReadyForDispatch"
+             availability="$SubsliceMask 2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="PS Thread Ready For Dispatch on Slice0 Subslice4 Thread Dispatcher"
+             description="The percentage of time in which PS thread is ready for dispatch on slice0 subslice4 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="B 3 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_thread04_ready_for_dispatch"
+             units="percent"
+             symbol_name="PSThread04ReadyForDispatch"
+             availability="$SubsliceMask 16 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="VS EU Stall"
+             description="The percentage of time in which vertex shaders were stalled on the EUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 14 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_eu_stall"
+             units="percent"
+             symbol_name="VsEuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="VS AVG Active per Thread"
+             description="The average number of cycles per hardware thread run in which vertex shaders were processed actively on the EUs."
+             data_type="uint64"
+             equation="A 13 READ A 1 READ UDIV"
+             underscore_name="vs_eu_active_per_thread"
+             units="cycles"
+             symbol_name="VsEuActivePerThread"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="PS Thread Ready For Dispatch on Slice0 Subslice2 Thread Dispatcher"
+             description="The percentage of time in which PS thread is ready for dispatch on slice0 subslice2 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="B 5 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_thread02_ready_for_dispatch"
+             units="percent"
+             symbol_name="PSThread02ReadyForDispatch"
+             availability="$SubsliceMask 4 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ A 31 READ UADD A 32 READ UADD 64 UMUL"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="PS Thread Ready For Dispatch on Slice0 Subslice6 Thread Dispatcher"
+             description="The percentage of time in which PS thread is ready for dispatch on slice0 subslice6 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="B 1 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_thread06_ready_for_dispatch"
+             units="percent"
+             symbol_name="PSThread06ReadyForDispatch"
+             availability="$SubsliceMask 64 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00000D04" value="0x00000200" />
+        <register type="NOA" address="0x00009840" value="0x00000000" />
+        <register type="NOA" address="0x00009884" value="0x00000000" />
+        <register type="NOA" address="0x00009888" value="0x14290000" />
+        <register type="NOA" address="0x00009888" value="0x142E0000" />
+        <register type="NOA" address="0x00009888" value="0x14690000" />
+        <register type="NOA" address="0x00009888" value="0x146E0000" />
+        <register type="NOA" address="0x00009888" value="0x14A90000" />
+        <register type="NOA" address="0x00009888" value="0x14AE0000" />
+        <register type="NOA" address="0x00009888" value="0x14E90000" />
+        <register type="NOA" address="0x00009888" value="0x14EE0000" />
+        <register type="NOA" address="0x00009888" value="0x161E8000" />
+        <register type="NOA" address="0x00009888" value="0x181E8000" />
+        <register type="NOA" address="0x00009888" value="0x1C1E1800" />
+        <register type="NOA" address="0x00009888" value="0x06204000" />
+        <register type="NOA" address="0x00009888" value="0x08204000" />
+        <register type="NOA" address="0x00009888" value="0x0A204000" />
+        <register type="NOA" address="0x00009888" value="0x0C204000" />
+        <register type="NOA" address="0x00009888" value="0x16218000" />
+        <register type="NOA" address="0x00009888" value="0x18218000" />
+        <register type="NOA" address="0x00009888" value="0x1E210018" />
+        <register type="NOA" address="0x00009888" value="0x0429C300" />
+        <register type="NOA" address="0x00009888" value="0x062900C5" />
+        <register type="NOA" address="0x00009888" value="0x10290000" />
+        <register type="NOA" address="0x00009888" value="0x062AC000" />
+        <register type="NOA" address="0x00009888" value="0x082AC000" />
+        <register type="NOA" address="0x00009888" value="0x0A2A4000" />
+        <register type="NOA" address="0x00009888" value="0x0C2A4000" />
+        <register type="NOA" address="0x00009888" value="0x062C4000" />
+        <register type="NOA" address="0x00009888" value="0x082C4000" />
+        <register type="NOA" address="0x00009888" value="0x0A2C4000" />
+        <register type="NOA" address="0x00009888" value="0x0C2C4000" />
+        <register type="NOA" address="0x00009888" value="0x022EC300" />
+        <register type="NOA" address="0x00009888" value="0x042E00C5" />
+        <register type="NOA" address="0x00009888" value="0x102E0000" />
+        <register type="NOA" address="0x00009888" value="0x062F4000" />
+        <register type="NOA" address="0x00009888" value="0x082F4000" />
+        <register type="NOA" address="0x00009888" value="0x1E5E0030" />
+        <register type="NOA" address="0x00009888" value="0x125E8000" />
+        <register type="NOA" address="0x00009888" value="0x145E8000" />
+        <register type="NOA" address="0x00009888" value="0x1A604000" />
+        <register type="NOA" address="0x00009888" value="0x1C600001" />
+        <register type="NOA" address="0x00009888" value="0x02604000" />
+        <register type="NOA" address="0x00009888" value="0x04604000" />
+        <register type="NOA" address="0x00009888" value="0x1E613000" />
+        <register type="NOA" address="0x00009888" value="0x12618000" />
+        <register type="NOA" address="0x00009888" value="0x14618000" />
+        <register type="NOA" address="0x00009888" value="0x0069C300" />
+        <register type="NOA" address="0x00009888" value="0x026900C5" />
+        <register type="NOA" address="0x00009888" value="0x10690000" />
+        <register type="NOA" address="0x00009888" value="0x1A6A00F0" />
+        <register type="NOA" address="0x00009888" value="0x026A4000" />
+        <register type="NOA" address="0x00009888" value="0x046A4000" />
+        <register type="NOA" address="0x00009888" value="0x186C5000" />
+        <register type="NOA" address="0x00009888" value="0x026C4000" />
+        <register type="NOA" address="0x00009888" value="0x046C4000" />
+        <register type="NOA" address="0x00009888" value="0x0E6EC5C3" />
+        <register type="NOA" address="0x00009888" value="0x106E0000" />
+        <register type="NOA" address="0x00009888" value="0x1A6F5000" />
+        <register type="NOA" address="0x00009888" value="0x1E9E000F" />
+        <register type="NOA" address="0x00009888" value="0x1AA01540" />
+        <register type="NOA" address="0x00009888" value="0x1EA10F00" />
+        <register type="NOA" address="0x00009888" value="0x0CA9C5C3" />
+        <register type="NOA" address="0x00009888" value="0x10A90000" />
+        <register type="NOA" address="0x00009888" value="0x18AAF000" />
+        <register type="NOA" address="0x00009888" value="0x1AAA0005" />
+        <register type="NOA" address="0x00009888" value="0x18AC0550" />
+        <register type="NOA" address="0x00009888" value="0x0AAEC5C3" />
+        <register type="NOA" address="0x00009888" value="0x10AE0000" />
+        <register type="NOA" address="0x00009888" value="0x1AAF0050" />
+        <register type="NOA" address="0x00009888" value="0x10DE8000" />
+        <register type="NOA" address="0x00009888" value="0x1CDEE000" />
+        <register type="NOA" address="0x00009888" value="0x00E04000" />
+        <register type="NOA" address="0x00009888" value="0x0EE04000" />
+        <register type="NOA" address="0x00009888" value="0x18E04000" />
+        <register type="NOA" address="0x00009888" value="0x1AE00010" />
+        <register type="NOA" address="0x00009888" value="0x10E18000" />
+        <register type="NOA" address="0x00009888" value="0x1EE100E0" />
+        <register type="NOA" address="0x00009888" value="0x08E9C5C3" />
+        <register type="NOA" address="0x00009888" value="0x10E90000" />
+        <register type="NOA" address="0x00009888" value="0x00EAC000" />
+        <register type="NOA" address="0x00009888" value="0x0EEAC000" />
+        <register type="NOA" address="0x00009888" value="0x18EA0500" />
+        <register type="NOA" address="0x00009888" value="0x00EC4000" />
+        <register type="NOA" address="0x00009888" value="0x0EEC4000" />
+        <register type="NOA" address="0x00009888" value="0x18EC0005" />
+        <register type="NOA" address="0x00009888" value="0x00EE00C3" />
+        <register type="NOA" address="0x00009888" value="0x06EEC500" />
+        <register type="NOA" address="0x00009888" value="0x10EE0000" />
+        <register type="NOA" address="0x00009888" value="0x00EF4000" />
+        <register type="NOA" address="0x00009888" value="0x0EEF4000" />
+        <register type="NOA" address="0x00009888" value="0x0C045400" />
+        <register type="NOA" address="0x00009888" value="0x0E045555" />
+        <register type="NOA" address="0x00009888" value="0x10040155" />
+        <register type="NOA" address="0x00009888" value="0x04055000" />
+        <register type="NOA" address="0x00009888" value="0x0A055000" />
+        <register type="NOA" address="0x00009888" value="0x0C055000" />
+        <register type="NOA" address="0x00009888" value="0x0E055000" />
+        <register type="NOA" address="0x00009888" value="0x14050055" />
+        <register type="NOA" address="0x00009888" value="0x06055000" />
+        <register type="NOA" address="0x00009888" value="0x08055000" />
+        <register type="NOA" address="0x00009888" value="0x2406FF00" />
+        <register type="NOA" address="0x00009888" value="0x260600FF" />
+        <register type="NOA" address="0x00009888" value="0x0E08A000" />
+        <register type="NOA" address="0x00009888" value="0x00088000" />
+        <register type="NOA" address="0x00009888" value="0x02082000" />
+        <register type="NOA" address="0x00009888" value="0x14090050" />
+        <register type="NOA" address="0x00009888" value="0x04094000" />
+        <register type="NOA" address="0x00009888" value="0x06091000" />
+        <register type="NOA" address="0x00009888" value="0x000D2000" />
+        <register type="NOA" address="0x00009888" value="0x060D8000" />
+        <register type="NOA" address="0x00009888" value="0x080DA000" />
+        <register type="NOA" address="0x00009888" value="0x040E1000" />
+        <register type="NOA" address="0x00009888" value="0x0A0E4000" />
+        <register type="NOA" address="0x00009888" value="0x0C0E5000" />
+        <register type="NOA" address="0x00009888" value="0x1812FC00" />
+        <register type="NOA" address="0x00009888" value="0x1A12002B" />
+        <register type="NOA" address="0x00009888" value="0x02128000" />
+        <register type="NOA" address="0x00009888" value="0x04128000" />
+        <register type="NOA" address="0x00009888" value="0x0813C000" />
+        <register type="NOA" address="0x00009888" value="0x0A13F000" />
+        <register type="NOA" address="0x00009888" value="0x04136000" />
+        <register type="NOA" address="0x00009888" value="0x0A14C000" />
+        <register type="NOA" address="0x00009888" value="0x0C14C000" />
+        <register type="NOA" address="0x00009888" value="0x0E14C000" />
+        <register type="NOA" address="0x00009888" value="0x00148000" />
+        <register type="NOA" address="0x00009888" value="0x02144000" />
+        <register type="NOA" address="0x00009888" value="0x00158000" />
+        <register type="NOA" address="0x00009888" value="0x0E158000" />
+        <register type="NOA" address="0x00009888" value="0x16152AD0" />
+        <register type="NOA" address="0x00009888" value="0x18150005" />
+        <register type="NOA" address="0x00009888" value="0x02154000" />
+        <register type="NOA" address="0x00009888" value="0x04154000" />
+        <register type="NOA" address="0x00009888" value="0x0615C000" />
+        <register type="NOA" address="0x00009888" value="0x0815C000" />
+        <register type="NOA" address="0x00009888" value="0x0A15C000" />
+        <register type="NOA" address="0x00009888" value="0x0C15C000" />
+        <register type="NOA" address="0x00009888" value="0x02188000" />
+        <register type="NOA" address="0x00009888" value="0x0418A000" />
+        <register type="NOA" address="0x00009888" value="0x06182000" />
+        <register type="NOA" address="0x00009888" value="0x0A198000" />
+        <register type="NOA" address="0x00009888" value="0x0C19A000" />
+        <register type="NOA" address="0x00009888" value="0x0E192000" />
+        <register type="NOA" address="0x00009888" value="0x0A1CA000" />
+        <register type="NOA" address="0x00009888" value="0x0C1CA000" />
+        <register type="NOA" address="0x00009888" value="0x121D5400" />
+        <register type="NOA" address="0x00009888" value="0x141D0002" />
+        <register type="NOA" address="0x00009884" value="0x00000003" />
+        <register type="NOA" address="0x00009888" value="0x301F8000" />
+        <register type="NOA" address="0x00009888" value="0x501F4924" />
+        <register type="NOA" address="0x00009888" value="0x521F4924" />
+        <register type="NOA" address="0x00009888" value="0x541F0024" />
+        <register type="NOA" address="0x00009888" value="0x3A1F8000" />
+        <register type="NOA" address="0x00009888" value="0x4E1F2400" />
+        <register type="NOA" address="0x00009888" value="0x3E1F3000" />
+        <register type="NOA" address="0x00009888" value="0x461F4030" />
+        <register type="NOA" address="0x00009888" value="0x481F0040" />
+        <register type="NOA" address="0x00009888" value="0x4A1F1000" />
+        <register type="NOA" address="0x00009888" value="0x4C1F0010" />
+        <register type="NOA" address="0x00009888" value="0x141F0000" />
+        <register type="NOA" address="0x00009888" value="0x401F1010" />
+        <register type="NOA" address="0x00009888" value="0x421F3030" />
+        <register type="NOA" address="0x00009888" value="0x441F4040" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0xF0800000" />
+        <register type="OA" address="0x00002770" value="0x00000018" />
+        <register type="OA" address="0x00002774" value="0x0000FFFC" />
+        <register type="OA" address="0x00002778" value="0x00000060" />
+        <register type="OA" address="0x0000277C" value="0x0000FFF3" />
+        <register type="OA" address="0x00002780" value="0x00000180" />
+        <register type="OA" address="0x00002784" value="0x0000FFCF" />
+        <register type="OA" address="0x00002788" value="0x00000600" />
+        <register type="OA" address="0x0000278C" value="0x0000FF3F" />
+        <register type="OA" address="0x00002790" value="0x00001800" />
+        <register type="OA" address="0x00002794" value="0x0000FCFF" />
+        <register type="OA" address="0x00002798" value="0x00006000" />
+        <register type="OA" address="0x0000279C" value="0x0000F3FF" />
+        <register type="OA" address="0x000027A0" value="0x00018000" />
+        <register type="OA" address="0x000027A4" value="0x0000CFFF" />
+        <register type="OA" address="0x000027A8" value="0x00060000" />
+        <register type="OA" address="0x000027AC" value="0x00003FFF" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E758" value="0x00015014" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+        <register type="FLEX" address="0x0000E65C" value="0x00055054" />
+    </register_config>
+  </set>
+
+  <set name="Metric set TDL_2"
+       mdapi_supported_apis="VK OGL OCL IO BB"
+       underscore_name="tdl_2"
+       hw_config_guid="80e75f86-f8bc-4903-bf0f-38fd26cca636"
+       chipset="LKF"
+       symbol_name="TDL_2"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SQ is full"
+             description="The percentage of time when SQ is filled above a threshold (usually 48 entries)"
+             data_type="float"
+             max_equation="100"
+             equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gt_request_queue_full"
+             units="percent"
+             symbol_name="GTRequestQueueFull"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on the both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Non-PS Thread Ready For Dispatch on Slice0 Subslice2 Thread Dispatcher"
+             description="The percentage of time in which non-PS thread is ready for dispatch on slice0 subslice2 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="GPU_CLOCK 0 READ C 1 READ FSUB 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="non_ps_thread02_ready_for_dispatch"
+             units="percent"
+             symbol_name="NonPSThread02ReadyForDispatch"
+             availability="$SubsliceMask 4 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Non-PS Thread Ready For Dispatch on Slice0 Subslice3 Thread Dispatcher"
+             description="The percentage of time in which non-PS thread is ready for dispatch on slice0 subslice3 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="GPU_CLOCK 0 READ C 2 READ FSUB 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="non_ps_thread03_ready_for_dispatch"
+             units="percent"
+             symbol_name="NonPSThread03ReadyForDispatch"
+             availability="$SubsliceMask 8 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="Non-PS Thread Ready For Dispatch on Slice0 Subslice0 Thread Dispatcher"
+             description="The percentage of time in which non-PS thread is ready for dispatch on slice0 subslice0 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="GPU_CLOCK 0 READ B 7 READ FSUB 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="non_ps_thread00_ready_for_dispatch"
+             units="percent"
+             symbol_name="NonPSThread00ReadyForDispatch"
+             availability="$SubsliceMask 1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Non-PS Thread Ready For Dispatch on Slice0 Subslice7 Thread Dispatcher"
+             description="The percentage of time in which non-PS thread is ready for dispatch on slice0 subslice7 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="GPU_CLOCK 0 READ C 6 READ FSUB 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="non_ps_thread07_ready_for_dispatch"
+             units="percent"
+             symbol_name="NonPSThread07ReadyForDispatch"
+             availability="$SubsliceMask 128 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Non-PS Thread Ready For Dispatch on Slice0 Subslice6 Thread Dispatcher"
+             description="The percentage of time in which non-PS thread is ready for dispatch on slice0 subslice6 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="GPU_CLOCK 0 READ C 5 READ FSUB 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="non_ps_thread06_ready_for_dispatch"
+             units="percent"
+             symbol_name="NonPSThread06ReadyForDispatch"
+             availability="$SubsliceMask 64 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="Non-PS Thread Ready For Dispatch on Slice0 Subslice5 Thread Dispatcher"
+             description="The percentage of time in which non-PS thread is ready for dispatch on slice0 subslice5 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="GPU_CLOCK 0 READ C 4 READ FSUB 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="non_ps_thread05_ready_for_dispatch"
+             units="percent"
+             symbol_name="NonPSThread05ReadyForDispatch"
+             availability="$SubsliceMask 32 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Non-PS Thread Ready For Dispatch on Slice0 Subslice4 Thread Dispatcher"
+             description="The percentage of time in which non-PS thread is ready for dispatch on slice0 subslice4 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="GPU_CLOCK 0 READ C 3 READ FSUB 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="non_ps_thread04_ready_for_dispatch"
+             units="percent"
+             symbol_name="NonPSThread04ReadyForDispatch"
+             availability="$SubsliceMask 16 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ A 31 READ UADD A 32 READ UADD 64 UMUL"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <counter name="Non-PS Thread Ready For Dispatch on Slice0 Subslice1 Thread Dispatcher"
+             description="The percentage of time in which non-PS thread is ready for dispatch on slice0 subslice1 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="GPU_CLOCK 0 READ C 0 READ FSUB 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="non_ps_thread01_ready_for_dispatch"
+             units="percent"
+             symbol_name="NonPSThread01ReadyForDispatch"
+             availability="$SubsliceMask 2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00000D04" value="0x00000200" />
+        <register type="NOA" address="0x00009840" value="0x00000000" />
+        <register type="NOA" address="0x00009884" value="0x00000000" />
+        <register type="NOA" address="0x00009888" value="0x14290000" />
+        <register type="NOA" address="0x00009888" value="0x142E0000" />
+        <register type="NOA" address="0x00009888" value="0x14690000" />
+        <register type="NOA" address="0x00009888" value="0x146E0000" />
+        <register type="NOA" address="0x00009888" value="0x14A90000" />
+        <register type="NOA" address="0x00009888" value="0x14AE0000" />
+        <register type="NOA" address="0x00009888" value="0x14E90000" />
+        <register type="NOA" address="0x00009888" value="0x14EE0000" />
+        <register type="NOA" address="0x00009888" value="0x1E1E0018" />
+        <register type="NOA" address="0x00009888" value="0x1A205000" />
+        <register type="NOA" address="0x00009888" value="0x1E211800" />
+        <register type="NOA" address="0x00009888" value="0x0C29C100" />
+        <register type="NOA" address="0x00009888" value="0x10290000" />
+        <register type="NOA" address="0x00009888" value="0x1A2A0034" />
+        <register type="NOA" address="0x00009888" value="0x182C1400" />
+        <register type="NOA" address="0x00009888" value="0x0E2E00C1" />
+        <register type="NOA" address="0x00009888" value="0x102E0000" />
+        <register type="NOA" address="0x00009888" value="0x1A2F1000" />
+        <register type="NOA" address="0x00009888" value="0x1E5E0020" />
+        <register type="NOA" address="0x00009888" value="0x125E8000" />
+        <register type="NOA" address="0x00009888" value="0x1C600001" />
+        <register type="NOA" address="0x00009888" value="0x02604000" />
+        <register type="NOA" address="0x00009888" value="0x1E612000" />
+        <register type="NOA" address="0x00009888" value="0x12618000" />
+        <register type="NOA" address="0x00009888" value="0x0E69C100" />
+        <register type="NOA" address="0x00009888" value="0x10690000" />
+        <register type="NOA" address="0x00009888" value="0x1A6A0040" />
+        <register type="NOA" address="0x00009888" value="0x026AC000" />
+        <register type="NOA" address="0x00009888" value="0x186C4000" />
+        <register type="NOA" address="0x00009888" value="0x026C4000" />
+        <register type="NOA" address="0x00009888" value="0x006EC100" />
+        <register type="NOA" address="0x00009888" value="0x106E0000" />
+        <register type="NOA" address="0x00009888" value="0x026F4000" />
+        <register type="NOA" address="0x00009888" value="0x149E8000" />
+        <register type="NOA" address="0x00009888" value="0x169E8000" />
+        <register type="NOA" address="0x00009888" value="0x04A04000" />
+        <register type="NOA" address="0x00009888" value="0x06A04000" />
+        <register type="NOA" address="0x00009888" value="0x14A18000" />
+        <register type="NOA" address="0x00009888" value="0x16A18000" />
+        <register type="NOA" address="0x00009888" value="0x02A900C1" />
+        <register type="NOA" address="0x00009888" value="0x10A90000" />
+        <register type="NOA" address="0x00009888" value="0x04AA4000" />
+        <register type="NOA" address="0x00009888" value="0x06AAC000" />
+        <register type="NOA" address="0x00009888" value="0x04AC4000" />
+        <register type="NOA" address="0x00009888" value="0x06AC4000" />
+        <register type="NOA" address="0x00009888" value="0x02AEC100" />
+        <register type="NOA" address="0x00009888" value="0x10AE0000" />
+        <register type="NOA" address="0x00009888" value="0x06AF4000" />
+        <register type="NOA" address="0x00009888" value="0x18DE8000" />
+        <register type="NOA" address="0x00009888" value="0x1CDE0800" />
+        <register type="NOA" address="0x00009888" value="0x08E04000" />
+        <register type="NOA" address="0x00009888" value="0x0AE04000" />
+        <register type="NOA" address="0x00009888" value="0x18E18000" />
+        <register type="NOA" address="0x00009888" value="0x1EE10008" />
+        <register type="NOA" address="0x00009888" value="0x04E900C1" />
+        <register type="NOA" address="0x00009888" value="0x10E90000" />
+        <register type="NOA" address="0x00009888" value="0x08EA4000" />
+        <register type="NOA" address="0x00009888" value="0x0AEAC000" />
+        <register type="NOA" address="0x00009888" value="0x08EC4000" />
+        <register type="NOA" address="0x00009888" value="0x0AEC4000" />
+        <register type="NOA" address="0x00009888" value="0x04EEC100" />
+        <register type="NOA" address="0x00009888" value="0x10EE0000" />
+        <register type="NOA" address="0x00009888" value="0x0AEF4000" />
+        <register type="NOA" address="0x00009888" value="0x10040150" />
+        <register type="NOA" address="0x00009888" value="0x0C045000" />
+        <register type="NOA" address="0x00009888" value="0x0E040015" />
+        <register type="NOA" address="0x00009888" value="0x14050054" />
+        <register type="NOA" address="0x00009888" value="0x04054000" />
+        <register type="NOA" address="0x00009888" value="0x06055000" />
+        <register type="NOA" address="0x00009888" value="0x08055000" />
+        <register type="NOA" address="0x00009888" value="0x260600E0" />
+        <register type="NOA" address="0x00009888" value="0x24063E00" />
+        <register type="NOA" address="0x00009888" value="0x0E088000" />
+        <register type="NOA" address="0x00009888" value="0x00088000" />
+        <register type="NOA" address="0x00009888" value="0x14090040" />
+        <register type="NOA" address="0x00009888" value="0x04094000" />
+        <register type="NOA" address="0x00009888" value="0x040DA000" />
+        <register type="NOA" address="0x00009888" value="0x080E5000" />
+        <register type="NOA" address="0x00009888" value="0x1A120020" />
+        <register type="NOA" address="0x00009888" value="0x02128000" />
+        <register type="NOA" address="0x00009888" value="0x0412C000" />
+        <register type="NOA" address="0x00009888" value="0x0612C000" />
+        <register type="NOA" address="0x00009888" value="0x0A138000" />
+        <register type="NOA" address="0x00009888" value="0x0413E000" />
+        <register type="NOA" address="0x00009888" value="0x0E148000" />
+        <register type="NOA" address="0x00009888" value="0x00148000" />
+        <register type="NOA" address="0x00009888" value="0x0214C000" />
+        <register type="NOA" address="0x00009888" value="0x16156000" />
+        <register type="NOA" address="0x00009888" value="0x18150007" />
+        <register type="NOA" address="0x00009888" value="0x02154000" />
+        <register type="NOA" address="0x00009888" value="0x04154000" />
+        <register type="NOA" address="0x00009888" value="0x06154000" />
+        <register type="NOA" address="0x00009888" value="0x08158000" />
+        <register type="NOA" address="0x00009888" value="0x0A158000" />
+        <register type="NOA" address="0x00009888" value="0x0C188000" />
+        <register type="NOA" address="0x00009888" value="0x0E182000" />
+        <register type="NOA" address="0x00009888" value="0x1419000A" />
+        <register type="NOA" address="0x00009888" value="0x021CA000" />
+        <register type="NOA" address="0x00009888" value="0x0A1DA000" />
+        <register type="NOA" address="0x00009884" value="0x00000003" />
+        <register type="NOA" address="0x00009888" value="0x1C1F3061" />
+        <register type="NOA" address="0x00009888" value="0x141F0000" />
+        <register type="NOA" address="0x00009888" value="0x521F4000" />
+        <register type="NOA" address="0x00009888" value="0x541F0024" />
+        <register type="NOA" address="0x00009888" value="0x3A1F8000" />
+        <register type="NOA" address="0x00009888" value="0x4E1F2410" />
+        <register type="NOA" address="0x00009888" value="0x501F0024" />
+        <register type="NOA" address="0x00009888" value="0x4C1F3040" />
+        <register type="NOA" address="0x00009888" value="0x301F0000" />
+        <register type="NOA" address="0x00009888" value="0x401F1000" />
+        <register type="NOA" address="0x00009888" value="0x421F4000" />
+        <register type="NOA" address="0x00009888" value="0x441F1730" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x00800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+    </register_config>
+  </set>
+
+  <set name="Metric set TDL_3"
+       mdapi_supported_apis="VK OGL OCL IO BB"
+       underscore_name="tdl_3"
+       hw_config_guid="9c517add-e263-4cbe-b7f8-9986f737e68a"
+       chipset="LKF"
+       symbol_name="TDL_3"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Thread Header Ready on Slice0 Subslice6 Thread Dispatcher Port 1"
+             description="The percentage of time in which thread header is ready on slice0 subslice6 thread dispatcher port 1"
+             data_type="float"
+             max_equation="100"
+             equation="C 5 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header06_ready_port1"
+             units="percent"
+             symbol_name="ThreadHeader06ReadyPort1"
+             availability="$SubsliceMask 64 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on the both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="Thread Header Ready on Slice0 Subslice3 Thread Dispatcher Port 0"
+             description="The percentage of time in which thread header is ready on slice0 subslice3 thread dispatcher port 0"
+             data_type="float"
+             max_equation="100"
+             equation="B 6 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header03_ready_port0"
+             units="percent"
+             symbol_name="ThreadHeader03ReadyPort0"
+             availability="$SubsliceMask 8 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Thread Header Ready on Slice0 Subslice3 Thread Dispatcher Port 1"
+             description="The percentage of time in which thread header is ready on slice0 subslice3 thread dispatcher port 1"
+             data_type="float"
+             max_equation="100"
+             equation="B 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header03_ready_port1"
+             units="percent"
+             symbol_name="ThreadHeader03ReadyPort1"
+             availability="$SubsliceMask 8 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Thread Header Ready on Slice0 Subslice4 Thread Dispatcher Port 1"
+             description="The percentage of time in which thread header is ready on slice0 subslice4 thread dispatcher port 1"
+             data_type="float"
+             max_equation="100"
+             equation="C 1 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header04_ready_port1"
+             units="percent"
+             symbol_name="ThreadHeader04ReadyPort1"
+             availability="$SubsliceMask 16 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Thread Header Ready on Slice0 Subslice4 Thread Dispatcher Port 0"
+             description="The percentage of time in which thread header is ready on slice0 subslice4 thread dispatcher port 0"
+             data_type="float"
+             max_equation="100"
+             equation="C 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header04_ready_port0"
+             units="percent"
+             symbol_name="ThreadHeader04ReadyPort0"
+             availability="$SubsliceMask 16 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Thread Header Ready on Slice0 Subslice6 Thread Dispatcher Port 0"
+             description="The percentage of time in which thread header is ready on slice0 subslice6 thread dispatcher port 0"
+             data_type="float"
+             max_equation="100"
+             equation="C 4 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header06_ready_port0"
+             units="percent"
+             symbol_name="ThreadHeader06ReadyPort0"
+             availability="$SubsliceMask 64 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Thread Header Ready on Slice0 Subslice1 Thread Dispatcher Port 0"
+             description="The percentage of time in which thread header is ready on slice0 subslice1 thread dispatcher port 0"
+             data_type="float"
+             max_equation="100"
+             equation="B 2 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header01_ready_port0"
+             units="percent"
+             symbol_name="ThreadHeader01ReadyPort0"
+             availability="$SubsliceMask 2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Thread Header Ready on Slice0 Subslice1 Thread Dispatcher Port 1"
+             description="The percentage of time in which thread header is ready on slice0 subslice1 thread dispatcher port 1"
+             data_type="float"
+             max_equation="100"
+             equation="B 3 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header01_ready_port1"
+             units="percent"
+             symbol_name="ThreadHeader01ReadyPort1"
+             availability="$SubsliceMask 2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Thread Header Ready on Slice0 Subslice7 Thread Dispatcher Port 0"
+             description="The percentage of time in which thread header is ready on slice0 subslice7 thread dispatcher port 0"
+             data_type="float"
+             max_equation="100"
+             equation="C 6 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header07_ready_port0"
+             units="percent"
+             symbol_name="ThreadHeader07ReadyPort0"
+             availability="$SubsliceMask 128 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Thread Header Ready on Slice0 Subslice2 Thread Dispatcher Port 1"
+             description="The percentage of time in which thread header is ready on slice0 subslice2 thread dispatcher port 1"
+             data_type="float"
+             max_equation="100"
+             equation="B 5 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header02_ready_port1"
+             units="percent"
+             symbol_name="ThreadHeader02ReadyPort1"
+             availability="$SubsliceMask 4 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Thread Header Ready on Slice0 Subslice2 Thread Dispatcher Port 0"
+             description="The percentage of time in which thread header is ready on slice0 subslice2 thread dispatcher port 0"
+             data_type="float"
+             max_equation="100"
+             equation="B 4 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header02_ready_port0"
+             units="percent"
+             symbol_name="ThreadHeader02ReadyPort0"
+             availability="$SubsliceMask 4 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Thread Header Ready on Slice0 Subslice5 Thread Dispatcher Port 0"
+             description="The percentage of time in which thread header is ready on slice0 subslice5 thread dispatcher port 0"
+             data_type="float"
+             max_equation="100"
+             equation="C 2 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header05_ready_port0"
+             units="percent"
+             symbol_name="ThreadHeader05ReadyPort0"
+             availability="$SubsliceMask 32 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Thread Header Ready on Slice0 Subslice7 Thread Dispatcher Port 1"
+             description="The percentage of time in which thread header is ready on slice0 subslice7 thread dispatcher port 1"
+             data_type="float"
+             max_equation="100"
+             equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header07_ready_port1"
+             units="percent"
+             symbol_name="ThreadHeader07ReadyPort1"
+             availability="$SubsliceMask 128 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ A 31 READ UADD A 32 READ UADD 64 UMUL"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="Thread Header Ready on Slice0 Subslice5 Thread Dispatcher Port 1"
+             description="The percentage of time in which thread header is ready on slice0 subslice5 thread dispatcher port 1"
+             data_type="float"
+             max_equation="100"
+             equation="C 3 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header05_ready_port1"
+             units="percent"
+             symbol_name="ThreadHeader05ReadyPort1"
+             availability="$SubsliceMask 32 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Thread Header Ready on Slice0 Subslice0 Thread Dispatcher Port 0"
+             description="The percentage of time in which thread header is ready on slice0 subslice0 thread dispatcher port 0"
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header00_ready_port0"
+             units="percent"
+             symbol_name="ThreadHeader00ReadyPort0"
+             availability="$SubsliceMask 1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <counter name="Thread Header Ready on Slice0 Subslice0 Thread Dispatcher Port 1"
+             description="The percentage of time in which thread header is ready on slice0 subslice0 thread dispatcher port 1"
+             data_type="float"
+             max_equation="100"
+             equation="B 1 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header00_ready_port1"
+             units="percent"
+             symbol_name="ThreadHeader00ReadyPort1"
+             availability="$SubsliceMask 1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00000D04" value="0x00000200" />
+        <register type="NOA" address="0x00009840" value="0x00000000" />
+        <register type="NOA" address="0x00009884" value="0x00000000" />
+        <register type="NOA" address="0x00009888" value="0x14292C00" />
+        <register type="NOA" address="0x00009888" value="0x16290013" />
+        <register type="NOA" address="0x00009888" value="0x142E2C00" />
+        <register type="NOA" address="0x00009888" value="0x162E0013" />
+        <register type="NOA" address="0x00009888" value="0x14692C00" />
+        <register type="NOA" address="0x00009888" value="0x16690013" />
+        <register type="NOA" address="0x00009888" value="0x146E2C00" />
+        <register type="NOA" address="0x00009888" value="0x166E0013" />
+        <register type="NOA" address="0x00009888" value="0x14A92C00" />
+        <register type="NOA" address="0x00009888" value="0x16A90013" />
+        <register type="NOA" address="0x00009888" value="0x14AE2C00" />
+        <register type="NOA" address="0x00009888" value="0x16AE0013" />
+        <register type="NOA" address="0x00009888" value="0x14E92C00" />
+        <register type="NOA" address="0x00009888" value="0x16E90013" />
+        <register type="NOA" address="0x00009888" value="0x14EE2C00" />
+        <register type="NOA" address="0x00009888" value="0x16EE0013" />
+        <register type="NOA" address="0x00009888" value="0x101E8000" />
+        <register type="NOA" address="0x00009888" value="0x1C1EE000" />
+        <register type="NOA" address="0x00009888" value="0x00204000" />
+        <register type="NOA" address="0x00009888" value="0x0E204000" />
+        <register type="NOA" address="0x00009888" value="0x18204000" />
+        <register type="NOA" address="0x00009888" value="0x1A200010" />
+        <register type="NOA" address="0x00009888" value="0x10218000" />
+        <register type="NOA" address="0x00009888" value="0x1E2100E0" />
+        <register type="NOA" address="0x00009888" value="0x002900C7" />
+        <register type="NOA" address="0x00009888" value="0x0629CF00" />
+        <register type="NOA" address="0x00009888" value="0x10290000" />
+        <register type="NOA" address="0x00009888" value="0x002A4000" />
+        <register type="NOA" address="0x00009888" value="0x0E2A4000" />
+        <register type="NOA" address="0x00009888" value="0x182A0F00" />
+        <register type="NOA" address="0x00009888" value="0x002C4000" />
+        <register type="NOA" address="0x00009888" value="0x0E2C4000" />
+        <register type="NOA" address="0x00009888" value="0x182C0005" />
+        <register type="NOA" address="0x00009888" value="0x082ECFC7" />
+        <register type="NOA" address="0x00009888" value="0x102E0000" />
+        <register type="NOA" address="0x00009888" value="0x1A2F0005" />
+        <register type="NOA" address="0x00009888" value="0x1E5E000F" />
+        <register type="NOA" address="0x00009888" value="0x1A601540" />
+        <register type="NOA" address="0x00009888" value="0x1E610F00" />
+        <register type="NOA" address="0x00009888" value="0x0A69CFC7" />
+        <register type="NOA" address="0x00009888" value="0x10690000" />
+        <register type="NOA" address="0x00009888" value="0x186A5000" />
+        <register type="NOA" address="0x00009888" value="0x1A6A000F" />
+        <register type="NOA" address="0x00009888" value="0x186C0550" />
+        <register type="NOA" address="0x00009888" value="0x0C6ECFC7" />
+        <register type="NOA" address="0x00009888" value="0x106E0000" />
+        <register type="NOA" address="0x00009888" value="0x1A6F0500" />
+        <register type="NOA" address="0x00009888" value="0x1E9E0030" />
+        <register type="NOA" address="0x00009888" value="0x129E8000" />
+        <register type="NOA" address="0x00009888" value="0x149E8000" />
+        <register type="NOA" address="0x00009888" value="0x1AA04000" />
+        <register type="NOA" address="0x00009888" value="0x1CA00001" />
+        <register type="NOA" address="0x00009888" value="0x02A04000" />
+        <register type="NOA" address="0x00009888" value="0x04A04000" />
+        <register type="NOA" address="0x00009888" value="0x1EA13000" />
+        <register type="NOA" address="0x00009888" value="0x12A18000" />
+        <register type="NOA" address="0x00009888" value="0x14A18000" />
+        <register type="NOA" address="0x00009888" value="0x0EA9CFC7" />
+        <register type="NOA" address="0x00009888" value="0x10A90000" />
+        <register type="NOA" address="0x00009888" value="0x1AAA0050" />
+        <register type="NOA" address="0x00009888" value="0x02AAC000" />
+        <register type="NOA" address="0x00009888" value="0x04AAC000" />
+        <register type="NOA" address="0x00009888" value="0x18AC5000" />
+        <register type="NOA" address="0x00009888" value="0x02AC4000" />
+        <register type="NOA" address="0x00009888" value="0x04AC4000" />
+        <register type="NOA" address="0x00009888" value="0x00AEC700" />
+        <register type="NOA" address="0x00009888" value="0x02AE00CF" />
+        <register type="NOA" address="0x00009888" value="0x10AE0000" />
+        <register type="NOA" address="0x00009888" value="0x02AF4000" />
+        <register type="NOA" address="0x00009888" value="0x04AF4000" />
+        <register type="NOA" address="0x00009888" value="0x16DE8000" />
+        <register type="NOA" address="0x00009888" value="0x18DE8000" />
+        <register type="NOA" address="0x00009888" value="0x1CDE1800" />
+        <register type="NOA" address="0x00009888" value="0x06E04000" />
+        <register type="NOA" address="0x00009888" value="0x08E04000" />
+        <register type="NOA" address="0x00009888" value="0x0AE04000" />
+        <register type="NOA" address="0x00009888" value="0x0CE04000" />
+        <register type="NOA" address="0x00009888" value="0x16E18000" />
+        <register type="NOA" address="0x00009888" value="0x18E18000" />
+        <register type="NOA" address="0x00009888" value="0x1EE10018" />
+        <register type="NOA" address="0x00009888" value="0x02E9C700" />
+        <register type="NOA" address="0x00009888" value="0x04E900CF" />
+        <register type="NOA" address="0x00009888" value="0x10E90000" />
+        <register type="NOA" address="0x00009888" value="0x06EA4000" />
+        <register type="NOA" address="0x00009888" value="0x08EA4000" />
+        <register type="NOA" address="0x00009888" value="0x0AEAC000" />
+        <register type="NOA" address="0x00009888" value="0x0CEAC000" />
+        <register type="NOA" address="0x00009888" value="0x06EC4000" />
+        <register type="NOA" address="0x00009888" value="0x08EC4000" />
+        <register type="NOA" address="0x00009888" value="0x0AEC4000" />
+        <register type="NOA" address="0x00009888" value="0x0CEC4000" />
+        <register type="NOA" address="0x00009888" value="0x04EEC700" />
+        <register type="NOA" address="0x00009888" value="0x06EE00CF" />
+        <register type="NOA" address="0x00009888" value="0x10EE0000" />
+        <register type="NOA" address="0x00009888" value="0x0AEF4000" />
+        <register type="NOA" address="0x00009888" value="0x0CEF4000" />
+        <register type="NOA" address="0x00009888" value="0x0C045400" />
+        <register type="NOA" address="0x00009888" value="0x0E045555" />
+        <register type="NOA" address="0x00009888" value="0x10040155" />
+        <register type="NOA" address="0x00009888" value="0x04055000" />
+        <register type="NOA" address="0x00009888" value="0x0A055000" />
+        <register type="NOA" address="0x00009888" value="0x0C055000" />
+        <register type="NOA" address="0x00009888" value="0x0E055000" />
+        <register type="NOA" address="0x00009888" value="0x14050055" />
+        <register type="NOA" address="0x00009888" value="0x06055000" />
+        <register type="NOA" address="0x00009888" value="0x08055000" />
+        <register type="NOA" address="0x00009888" value="0x2406FF00" />
+        <register type="NOA" address="0x00009888" value="0x260600FF" />
+        <register type="NOA" address="0x00009888" value="0x0A08A000" />
+        <register type="NOA" address="0x00009888" value="0x0C08A000" />
+        <register type="NOA" address="0x00009888" value="0x0E095000" />
+        <register type="NOA" address="0x00009888" value="0x14090005" />
+        <register type="NOA" address="0x00009888" value="0x020D8000" />
+        <register type="NOA" address="0x00009888" value="0x040DA000" />
+        <register type="NOA" address="0x00009888" value="0x060D2000" />
+        <register type="NOA" address="0x00009888" value="0x060E4000" />
+        <register type="NOA" address="0x00009888" value="0x080E5000" />
+        <register type="NOA" address="0x00009888" value="0x0A0E1000" />
+        <register type="NOA" address="0x00009888" value="0x1812A800" />
+        <register type="NOA" address="0x00009888" value="0x1A12003E" />
+        <register type="NOA" address="0x00009888" value="0x0212C000" />
+        <register type="NOA" address="0x00009888" value="0x0412C000" />
+        <register type="NOA" address="0x00009888" value="0x0813C000" />
+        <register type="NOA" address="0x00009888" value="0x0A13F000" />
+        <register type="NOA" address="0x00009888" value="0x04136000" />
+        <register type="NOA" address="0x00009888" value="0x0A14C000" />
+        <register type="NOA" address="0x00009888" value="0x0C14C000" />
+        <register type="NOA" address="0x00009888" value="0x0E14C000" />
+        <register type="NOA" address="0x00009888" value="0x00148000" />
+        <register type="NOA" address="0x00009888" value="0x02144000" />
+        <register type="NOA" address="0x00009888" value="0x0015C000" />
+        <register type="NOA" address="0x00009888" value="0x0E15C000" />
+        <register type="NOA" address="0x00009888" value="0x16152AF8" />
+        <register type="NOA" address="0x00009888" value="0x18150005" />
+        <register type="NOA" address="0x00009888" value="0x02154000" />
+        <register type="NOA" address="0x00009888" value="0x04154000" />
+        <register type="NOA" address="0x00009888" value="0x06158000" />
+        <register type="NOA" address="0x00009888" value="0x08158000" />
+        <register type="NOA" address="0x00009888" value="0x0A158000" />
+        <register type="NOA" address="0x00009888" value="0x0C158000" />
+        <register type="NOA" address="0x00009888" value="0x00182000" />
+        <register type="NOA" address="0x00009888" value="0x06188000" />
+        <register type="NOA" address="0x00009888" value="0x0818A000" />
+        <register type="NOA" address="0x00009888" value="0x08192000" />
+        <register type="NOA" address="0x00009888" value="0x0E198000" />
+        <register type="NOA" address="0x00009888" value="0x12190140" />
+        <register type="NOA" address="0x00009888" value="0x0E1CA000" />
+        <register type="NOA" address="0x00009888" value="0x001C8000" />
+        <register type="NOA" address="0x00009888" value="0x021C2000" />
+        <register type="NOA" address="0x00009888" value="0x141D0028" />
+        <register type="NOA" address="0x00009888" value="0x081D8000" />
+        <register type="NOA" address="0x00009888" value="0x0A1D2000" />
+        <register type="NOA" address="0x00009884" value="0x00000003" />
+        <register type="NOA" address="0x00009888" value="0x301F8000" />
+        <register type="NOA" address="0x00009888" value="0x501F4924" />
+        <register type="NOA" address="0x00009888" value="0x521F4924" />
+        <register type="NOA" address="0x00009888" value="0x541F0024" />
+        <register type="NOA" address="0x00009888" value="0x3A1F8000" />
+        <register type="NOA" address="0x00009888" value="0x4E1F2410" />
+        <register type="NOA" address="0x00009888" value="0x3E1F4000" />
+        <register type="NOA" address="0x00009888" value="0x461F3040" />
+        <register type="NOA" address="0x00009888" value="0x481F1030" />
+        <register type="NOA" address="0x00009888" value="0x4A1F0010" />
+        <register type="NOA" address="0x00009888" value="0x4C1F1000" />
+        <register type="NOA" address="0x00009888" value="0x141F0000" />
+        <register type="NOA" address="0x00009888" value="0x401F0000" />
+        <register type="NOA" address="0x00009888" value="0x421F4040" />
+        <register type="NOA" address="0x00009888" value="0x441F3030" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x00800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+    </register_config>
+  </set>
+
+  <set name="Gpu Rings Busyness"
+       mdapi_supported_apis="VK OGL OCL MEDIA IO BB"
+       underscore_name="gpu_busyness"
+       hw_config_guid="c3103887-8c7c-482a-b923-3d68dd340598"
+       chipset="LKF"
+       symbol_name="GpuBusyness"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="Vebox Ring Busy"
+             description="The percentage of time when vebox command streamer was busy."
+             data_type="float"
+             max_equation="100"
+             equation="C 4 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vebox_busy"
+             units="percent"
+             symbol_name="VeboxBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="System Frame Batch"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Render Ring Busy"
+             description="The percentage of time when render command streamer was busy."
+             data_type="float"
+             max_equation="100"
+             equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="render_busy"
+             units="percent"
+             symbol_name="RenderBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="System Frame Batch"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Vdbox0 Ring Busy"
+             description="The percentage of time when Vdbox0 command streamer was busy."
+             data_type="float"
+             max_equation="100"
+             equation="C 6 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vdbox0_busy"
+             units="percent"
+             symbol_name="Vdbox0Busy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="System Frame Batch"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Posh Ring Busy"
+             description="The percentage of time when posh command streamer was busy."
+             data_type="float"
+             max_equation="100"
+             equation="C 2 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="posh_engine_busy"
+             units="percent"
+             symbol_name="PoshEngineBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="System Frame Batch"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Blitter Ring Busy"
+             description="The percentage of time when blitter command streamer was busy."
+             data_type="float"
+             max_equation="100"
+             equation="C 3 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="blitter_busy"
+             units="percent"
+             symbol_name="BlitterBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="System Frame Batch"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Vdbox1 Ring Busy"
+             description="The percentage of time when Vdbox1 command streamer was busy."
+             data_type="float"
+             max_equation="100"
+             equation="C 5 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vdbox1_busy"
+             units="percent"
+             symbol_name="Vdbox1Busy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="System Frame Batch"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="AnyRingBusy"
+             description="The percentage of time when any command streamer was busy."
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="any_ring_busy"
+             units="percent"
+             symbol_name="AnyRingBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00000D04" value="0x00000200" />
+        <register type="NOA" address="0x00009840" value="0x00000000" />
+        <register type="NOA" address="0x00009884" value="0x00000003" />
+        <register type="NOA" address="0x00009888" value="0x12021200" />
+        <register type="NOA" address="0x00009888" value="0x14040120" />
+        <register type="NOA" address="0x00009888" value="0x10002400" />
+        <register type="NOA" address="0x00009888" value="0x02020083" />
+        <register type="NOA" address="0x00009888" value="0x10020000" />
+        <register type="NOA" address="0x00009888" value="0x00020000" />
+        <register type="NOA" address="0x00009888" value="0x06040043" />
+        <register type="NOA" address="0x00009888" value="0x10040000" />
+        <register type="NOA" address="0x00009888" value="0x1C040004" />
+        <register type="NOA" address="0x00009888" value="0x02000023" />
+        <register type="NOA" address="0x00009888" value="0x22000000" />
+        <register type="NOA" address="0x00009888" value="0x14000000" />
+        <register type="NOA" address="0x00009888" value="0x18008000" />
+        <register type="NOA" address="0x00009888" value="0x04194000" />
+        <register type="NOA" address="0x00009888" value="0x081A8000" />
+        <register type="NOA" address="0x00009888" value="0x3A1F6000" />
+        <register type="NOA" address="0x00009888" value="0x4E1F2900" />
+        <register type="NOA" address="0x00009888" value="0x501F00E9" />
+        <register type="NOA" address="0x00009888" value="0x04218000" />
+        <register type="NOA" address="0x00009888" value="0x06212000" />
+        <register type="NOA" address="0x00009888" value="0x141F0000" />
+        <register type="NOA" address="0x00009888" value="0x401F0160" />
+        <register type="NOA" address="0x00009888" value="0x421F0050" />
+        <register type="NOA" address="0x00009888" value="0x441F0100" />
+        <register type="NOA" address="0x00009888" value="0x301F0000" />
+        <register type="NOA" address="0x00009884" value="0x00000002" />
+        <register type="NOA" address="0x00009888" value="0x181B2400" />
+        <register type="NOA" address="0x00009888" value="0x185B2400" />
+        <register type="NOA" address="0x00009888" value="0x14231200" />
+        <register type="NOA" address="0x00009888" value="0x06218000" />
+        <register type="NOA" address="0x00009888" value="0x08212000" />
+        <register type="NOA" address="0x00009888" value="0x080D8000" />
+        <register type="NOA" address="0x00009888" value="0x040F4000" />
+        <register type="NOA" address="0x00009888" value="0x0828C000" />
+        <register type="NOA" address="0x00009888" value="0x041B8300" />
+        <register type="NOA" address="0x00009888" value="0x221B0000" />
+        <register type="NOA" address="0x00009888" value="0x1A1B0000" />
+        <register type="NOA" address="0x00009888" value="0x22162000" />
+        <register type="NOA" address="0x00009888" value="0x084D4000" />
+        <register type="NOA" address="0x00009888" value="0x044F1000" />
+        <register type="NOA" address="0x00009888" value="0x08683000" />
+        <register type="NOA" address="0x00009888" value="0x045B0083" />
+        <register type="NOA" address="0x00009888" value="0x225B0000" />
+        <register type="NOA" address="0x00009888" value="0x22560800" />
+        <register type="NOA" address="0x00009888" value="0x06230093" />
+        <register type="NOA" address="0x00009888" value="0x20230000" />
+        <register type="NOA" address="0x00009888" value="0x0A238000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x10800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+        <register type="OA" address="0x00002770" value="0x0007C000" />
+        <register type="OA" address="0x00002774" value="0x000007FF" />
+    </register_config>
+  </set>
+
+  <set name="Metric set TestOa"
+       mdapi_supported_apis="VK OGL OCL IO BB"
+       underscore_name="test_oa"
+       hw_config_guid="82b6b321-f93e-445a-a285-f30391ef1dc5"
+       chipset="LKF"
+       symbol_name="TestOa"
+       >
+    <counter name="TestCounter7"
+             description="HW test counter 7. Factor: 0.6666"
+             data_type="uint64"
+             equation="B 7 READ"
+             underscore_name="counter7"
+             units="events"
+             symbol_name="Counter7"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="TestCounter8"
+             description="HW test counter 8. Should be equal to 1."
+             data_type="uint64"
+             equation="C 0 READ"
+             underscore_name="counter8"
+             units="events"
+             symbol_name="Counter8"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="TestCounter4"
+             description="HW test counter 4. Factor: 0.3333"
+             data_type="uint64"
+             equation="B 4 READ"
+             underscore_name="counter4"
+             units="events"
+             symbol_name="Counter4"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="TestCounter5"
+             description="HW test counter 5. Factor: 0.3333"
+             data_type="uint64"
+             equation="B 5 READ"
+             underscore_name="counter5"
+             units="events"
+             symbol_name="Counter5"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="TestCounter6"
+             description="HW test counter 6. Factor: 0.16666"
+             data_type="uint64"
+             equation="B 6 READ"
+             underscore_name="counter6"
+             units="events"
+             symbol_name="Counter6"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="TestCounter3"
+             description="HW test counter 3. Factor: 0.5"
+             data_type="uint64"
+             equation="B 3 READ"
+             underscore_name="counter3"
+             units="events"
+             symbol_name="Counter3"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="TestCounter0"
+             description="HW test counter 0. Factor: 0.0"
+             data_type="uint64"
+             equation="B 0 READ"
+             underscore_name="counter0"
+             units="events"
+             symbol_name="Counter0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="TestCounter1"
+             description="HW test counter 1. Factor: 1.0"
+             data_type="uint64"
+             equation="B 1 READ"
+             underscore_name="counter1"
+             units="events"
+             symbol_name="Counter1"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="TestCounter2"
+             description="HW test counter 2. Factor: 1.0"
+             data_type="uint64"
+             equation="B 2 READ"
+             underscore_name="counter2"
+             units="events"
+             symbol_name="Counter2"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00000D04" value="0x00000200" />
+        <register type="NOA" address="0x00009840" value="0x00000000" />
+        <register type="NOA" address="0x00009884" value="0x00000003" />
+        <register type="NOA" address="0x00009888" value="0x18130000" />
+        <register type="NOA" address="0x00009888" value="0x22000004" />
+        <register type="NOA" address="0x00009888" value="0x0E130076" />
+        <register type="NOA" address="0x00009888" value="0x10130000" />
+        <register type="NOA" address="0x00009888" value="0x1E130000" />
+        <register type="NOA" address="0x00009888" value="0x0E164000" />
+        <register type="NOA" address="0x00009888" value="0x1A1A0004" />
+        <register type="NOA" address="0x00009888" value="0x541F0001" />
+        <register type="NOA" address="0x00009888" value="0x141F0000" />
+        <register type="NOA" address="0x00009888" value="0x4C1F0000" />
+        <register type="NOA" address="0x00009888" value="0x301F0000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0xF0800000" />
+        <register type="OA" address="0x00002770" value="0x00000004" />
+        <register type="OA" address="0x00002774" value="0x0000FFFF" />
+        <register type="OA" address="0x00002778" value="0x00000003" />
+        <register type="OA" address="0x0000277C" value="0x0000FFFF" />
+        <register type="OA" address="0x00002780" value="0x00000007" />
+        <register type="OA" address="0x00002784" value="0x0000FFFF" />
+        <register type="OA" address="0x00002788" value="0x00100002" />
+        <register type="OA" address="0x0000278C" value="0x0000FFF7" />
+        <register type="OA" address="0x00002790" value="0x00100002" />
+        <register type="OA" address="0x00002794" value="0x0000FFCF" />
+        <register type="OA" address="0x00002798" value="0x00100082" />
+        <register type="OA" address="0x0000279C" value="0x0000FFEF" />
+        <register type="OA" address="0x000027A0" value="0x001000C2" />
+        <register type="OA" address="0x000027A4" value="0x0000FFE7" />
+        <register type="OA" address="0x000027A8" value="0x00100001" />
+        <register type="OA" address="0x000027AC" value="0x0000FFE7" />
+    </register_config>
+  </set>
+
+</metrics>
diff --git a/lib/i915/perf-configs/oa-sklgt2.xml b/lib/i915/perf-configs/oa-sklgt2.xml
new file mode 100644
index 00000000..cad7d139
--- /dev/null
+++ b/lib/i915/perf-configs/oa-sklgt2.xml
@@ -0,0 +1,11895 @@
+<?xml version="1.0"?>
+<metrics version="1581935518" merge_md5="">
+  <set name="Render Metrics Basic Gen9"
+       mdapi_supported_apis="VK OGL OCL IO BB"
+       underscore_name="render_basic"
+       hw_config_guid="07b25942-d9fd-4fce-bd58-e29abd66b7de"
+       chipset="SKLGT2"
+       symbol_name="RenderBasic"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Misses"
+             description="The total number of L3 misses."
+             data_type="uint64"
+             equation="C 4 READ"
+             underscore_name="l3_misses"
+             units="messages"
+             symbol_name="L3Misses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/TAG"
+             />
+    <counter name="GTI L3 Throughput"
+             description="The total number of GPU memory bytes transferred between L3 caches and GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="$L3Misses 64 UMUL"
+             underscore_name="gti_l3_throughput"
+             units="bytes"
+             symbol_name="GtiL3Throughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Cache Misses"
+             description="The total number of sampler cache misses in all LODs in all sampler units."
+             data_type="uint64"
+             equation="B 4 READ 8 UMUL"
+             underscore_name="sampler_l1_misses"
+             units="messages"
+             symbol_name="SamplerL1Misses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler 1 Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which Sampler 1 has been slowing down the pipe when processing EU requests."
+             data_type="float"
+             high_watermark="15"
+             equation="B 3 READ 100 UMUL $GpuCoreClocks FDIV"
+             max_equation="100"
+             underscore_name="sampler1_bottleneck"
+             units="percent"
+             symbol_name="Sampler1Bottleneck"
+             availability="$SubsliceMask 0x12 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="L3 Sampler Throughput"
+             description="The total number of GPU memory bytes transferred between samplers and L3 caches."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="$SamplerL1Misses 64 UMUL"
+             underscore_name="l3_sampler_throughput"
+             units="bytes"
+             symbol_name="L3SamplerThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Sampler"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on the both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Sampler 0 Busy"
+             description="The percentage of time in which Sampler 0 has been processing EU requests."
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler0_busy"
+             units="percent"
+             symbol_name="Sampler0Busy"
+             availability="$SubsliceMask 0x09 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_group="Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Sampler 1 Busy"
+             description="The percentage of time in which Sampler 1 has been processing EU requests."
+             data_type="float"
+             max_equation="100"
+             equation="B 1 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler1_busy"
+             units="percent"
+             symbol_name="Sampler1Busy"
+             availability="$SubsliceMask 0x12 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_group="Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Samplers Busy"
+             description="The percentage of time in which samplers have been processing EU requests."
+             data_type="float"
+             max_equation="100"
+             equation="$Sampler0Busy $Sampler1Busy FMAX"
+             underscore_name="samplers_busy"
+             units="percent"
+             symbol_name="SamplersBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="Sampler"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="GTI Fixed Pipe Throughput"
+             description="The total number of GPU memory bytes transferred between 3D Pipeline (Command Dispatch, Input Assembly and Stream Output) and GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL"
+             equation="B 6 READ B 7 READ UADD 64 UMUL"
+             underscore_name="gti_vf_throughput"
+             units="bytes"
+             symbol_name="GtiVfThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="GTI/3D Pipe"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler 0 Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which Sampler 0 has been slowing down the pipe when processing EU requests."
+             data_type="float"
+             high_watermark="15"
+             equation="B 2 READ 100 UMUL $GpuCoreClocks FDIV"
+             max_equation="100"
+             underscore_name="sampler0_bottleneck"
+             units="percent"
+             symbol_name="Sampler0Bottleneck"
+             availability="$SubsliceMask 0x09 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="L3 Lookup Accesses w/o IC"
+             description="The total number of L3 cache lookup accesses w/o IC."
+             data_type="uint64"
+             equation="$SamplerL1Misses $ShaderMemoryAccesses UADD"
+             underscore_name="l3_lookups"
+             units="messages"
+             symbol_name="L3Lookups"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/TAG"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GTI Read Throughput"
+             description="The total number of GPU memory bytes read from GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL"
+             equation="C 6 READ 64 UMUL"
+             underscore_name="gti_read_throughput"
+             units="bytes"
+             symbol_name="GtiReadThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GTI Depth Throughput"
+             description="The total number of GPU memory bytes transferred between depth caches and GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="C 0 READ C 1 READ UADD 64 UMUL"
+             underscore_name="gti_depth_throughput"
+             units="bytes"
+             symbol_name="GtiDepthThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="GTI/Depth Cache"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Samplers Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which samplers have been slowing down the pipe when processing EU requests."
+             data_type="float"
+             high_watermark="15"
+             equation="$Sampler0Bottleneck $Sampler1Bottleneck FMAX"
+             max_equation="100"
+             underscore_name="sampler_bottleneck"
+             units="percent"
+             symbol_name="SamplerBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Indicate System Frame Batch Draw"
+             mdapi_group="Sampler"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="GTI HDC TLB Lookup Throughput"
+             description="The total number of GPU memory bytes transferred between GTI and HDC, when HDC is doing TLB lookups."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="C 5 READ 64 UMUL"
+             underscore_name="gti_hdc_lookups_throughput"
+             units="bytes"
+             symbol_name="GtiHdcLookupsThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GTI RCC Throughput"
+             description="The total number of GPU memory bytes transferred between render color caches and GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="C 2 READ C 3 READ UADD 64 UMUL"
+             underscore_name="gti_rcc_throughput"
+             units="bytes"
+             symbol_name="GtiRccThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="GTI/Color Cache"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="GTI Write Throughput"
+             description="The total number of GPU memory bytes written to GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 32 UMUL"
+             equation="C 7 READ 64 UMUL"
+             underscore_name="gti_write_throughput"
+             units="bytes"
+             symbol_name="GtiWriteThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA"
+                     availability="$SkuRevisionId 0x02 UGTE"
+                     priority="0"
+                     >
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x166C01E0" />
+        <register type="NOA" address="0x00009888" value="0x12170280" />
+        <register type="NOA" address="0x00009888" value="0x12370280" />
+        <register type="NOA" address="0x00009888" value="0x11930317" />
+        <register type="NOA" address="0x00009888" value="0x159303DF" />
+        <register type="NOA" address="0x00009888" value="0x3F900003" />
+        <register type="NOA" address="0x00009888" value="0x1A4E0080" />
+        <register type="NOA" address="0x00009888" value="0x0A6C0053" />
+        <register type="NOA" address="0x00009888" value="0x106C0000" />
+        <register type="NOA" address="0x00009888" value="0x1C6C0000" />
+        <register type="NOA" address="0x00009888" value="0x0A1B4000" />
+        <register type="NOA" address="0x00009888" value="0x1C1C0001" />
+        <register type="NOA" address="0x00009888" value="0x002F1000" />
+        <register type="NOA" address="0x00009888" value="0x042F1000" />
+        <register type="NOA" address="0x00009888" value="0x004C4000" />
+        <register type="NOA" address="0x00009888" value="0x0A4C8400" />
+        <register type="NOA" address="0x00009888" value="0x000D2000" />
+        <register type="NOA" address="0x00009888" value="0x060D8000" />
+        <register type="NOA" address="0x00009888" value="0x080DA000" />
+        <register type="NOA" address="0x00009888" value="0x0A0D2000" />
+        <register type="NOA" address="0x00009888" value="0x0C0F0400" />
+        <register type="NOA" address="0x00009888" value="0x0E0F6600" />
+        <register type="NOA" address="0x00009888" value="0x002C8000" />
+        <register type="NOA" address="0x00009888" value="0x162C2200" />
+        <register type="NOA" address="0x00009888" value="0x062D8000" />
+        <register type="NOA" address="0x00009888" value="0x082D8000" />
+        <register type="NOA" address="0x00009888" value="0x00133000" />
+        <register type="NOA" address="0x00009888" value="0x08133000" />
+        <register type="NOA" address="0x00009888" value="0x00170020" />
+        <register type="NOA" address="0x00009888" value="0x08170021" />
+        <register type="NOA" address="0x00009888" value="0x10170000" />
+        <register type="NOA" address="0x00009888" value="0x0633C000" />
+        <register type="NOA" address="0x00009888" value="0x0833C000" />
+        <register type="NOA" address="0x00009888" value="0x06370800" />
+        <register type="NOA" address="0x00009888" value="0x08370840" />
+        <register type="NOA" address="0x00009888" value="0x10370000" />
+        <register type="NOA" address="0x00009888" value="0x0D933031" />
+        <register type="NOA" address="0x00009888" value="0x0F933E3F" />
+        <register type="NOA" address="0x00009888" value="0x01933D00" />
+        <register type="NOA" address="0x00009888" value="0x0393073C" />
+        <register type="NOA" address="0x00009888" value="0x0593000E" />
+        <register type="NOA" address="0x00009888" value="0x1D930000" />
+        <register type="NOA" address="0x00009888" value="0x19930000" />
+        <register type="NOA" address="0x00009888" value="0x1B930000" />
+        <register type="NOA" address="0x00009888" value="0x1D900157" />
+        <register type="NOA" address="0x00009888" value="0x1F900158" />
+        <register type="NOA" address="0x00009888" value="0x35900000" />
+        <register type="NOA" address="0x00009888" value="0x2B908000" />
+        <register type="NOA" address="0x00009888" value="0x2D908000" />
+        <register type="NOA" address="0x00009888" value="0x2F908000" />
+        <register type="NOA" address="0x00009888" value="0x31908000" />
+        <register type="NOA" address="0x00009888" value="0x15908000" />
+        <register type="NOA" address="0x00009888" value="0x17908000" />
+        <register type="NOA" address="0x00009888" value="0x19908000" />
+        <register type="NOA" address="0x00009888" value="0x1B908000" />
+        <register type="NOA" address="0x00009888" value="0x1190001F" />
+        <register type="NOA" address="0x00009888" value="0x51904400" />
+        <register type="NOA" address="0x00009888" value="0x41900020" />
+        <register type="NOA" address="0x00009888" value="0x55900000" />
+        <register type="NOA" address="0x00009888" value="0x45900C21" />
+        <register type="NOA" address="0x00009888" value="0x47900061" />
+        <register type="NOA" address="0x00009888" value="0x57904440" />
+        <register type="NOA" address="0x00009888" value="0x49900000" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+        <register type="NOA" address="0x00009888" value="0x4B900000" />
+        <register type="NOA" address="0x00009888" value="0x59900004" />
+        <register type="NOA" address="0x00009888" value="0x43900000" />
+        <register type="NOA" address="0x00009888" value="0x53904444" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x00800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+        <register type="OA" address="0x00002740" value="0x00000000" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E758" value="0x00015014" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+        <register type="FLEX" address="0x0000E65C" value="0x00222222" />
+    </register_config>
+  </set>
+
+  <set name="Compute Metrics Basic Gen9"
+       mdapi_supported_apis="VK OGL4 OCL IO BB"
+       underscore_name="compute_basic"
+       hw_config_guid="00b80b4c-d215-4378-9015-da3dda3b61ea"
+       chipset="SKLGT2"
+       symbol_name="ComputeBasic"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Untyped Bytes Read"
+             description="The total number of untyped memory bytes read via Data Port."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="B 6 READ B 7 READ C 0 READ UADD UADD $EuSlicesTotalCount 64 UMUL UMUL"
+             underscore_name="untyped_bytes_read"
+             units="bytes"
+             symbol_name="UntypedBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Typed Bytes Written"
+             description="The total number of typed memory bytes written via Data Port."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="B 3 READ B 4 READ B 5 READ UADD UADD $EuSlicesTotalCount 64 UMUL UMUL"
+             underscore_name="typed_bytes_written"
+             units="bytes"
+             symbol_name="TypedBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="fpu0_active"
+             units="percent"
+             symbol_name="Fpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="fpu1_active"
+             units="percent"
+             symbol_name="Fpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO OCL BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU AVG IPC Rate"
+             description="The average rate of IPC calculated for 2 FPU pipelines."
+             data_type="float"
+             max_equation="2"
+             equation="A 9 READ  A 10 READ  A 11 READ UADD  A 9 READ USUB FDIV 1 FADD"
+             underscore_name="eu_avg_ipc_rate"
+             units="number"
+             symbol_name="EuAvgIpcRate"
+             semantic_type="ratio"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier4 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO OCL BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO OCL BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texel lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GTI Read Throughput"
+             description="The total number of GPU memory bytes read from GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="C 4 READ 64 UMUL"
+             underscore_name="gti_read_throughput"
+             units="bytes"
+             symbol_name="GtiReadThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Untyped Writes"
+             description="The total number of untyped memory bytes written via Data Port."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="C 1 READ C 2 READ C 3 READ UADD UADD $EuSlicesTotalCount 64 UMUL UMUL"
+             underscore_name="untyped_bytes_written"
+             units="bytes"
+             symbol_name="UntypedBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO OCL BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="Typed Bytes Read"
+             description="The total number of typed memory bytes read via Data Port."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="B 0 READ B 1 READ B 2 READ UADD UADD $EuSlicesTotalCount 64 UMUL UMUL"
+             underscore_name="typed_bytes_read"
+             units="bytes"
+             symbol_name="TypedBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="EU Thread Occupancy"
+             description="The percentage of time in which hardware threads occupied EUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 13 READ 8 UMUL $EuCoresTotalCount UDIV $EuThreadsCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_thread_occupancy"
+             units="percent"
+             symbol_name="EuThreadOccupancy"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO OCL BB"
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO OCL BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO OCL BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="GTI Write Throughput"
+             description="The total number of GPU memory bytes written to GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 32 UMUL"
+             equation="C 5 READ 64 UMUL"
+             underscore_name="gti_write_throughput"
+             units="bytes"
+             symbol_name="GtiWriteThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO OCL BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO OCL BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <counter name="EU Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_send_active"
+             units="percent"
+             symbol_name="EuSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO OCL BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <register_config type="NOA"
+                     availability="$SliceMask 0x01 AND $SkuRevisionId 0x02 ULT &amp;&amp;"
+                     priority="0"
+                     >
+        <register type="NOA" address="0x00009840" value="0x000000A0" />
+        <register type="NOA" address="0x00009888" value="0x104F00E0" />
+        <register type="NOA" address="0x00009888" value="0x124F1C00" />
+        <register type="NOA" address="0x00009888" value="0x106C00E0" />
+        <register type="NOA" address="0x00009888" value="0x37906800" />
+        <register type="NOA" address="0x00009888" value="0x3F901403" />
+        <register type="NOA" address="0x00009888" value="0x184E8000" />
+        <register type="NOA" address="0x00009888" value="0x1A4E8200" />
+        <register type="NOA" address="0x00009888" value="0x044E8000" />
+        <register type="NOA" address="0x00009888" value="0x004F0DB2" />
+        <register type="NOA" address="0x00009888" value="0x064F0900" />
+        <register type="NOA" address="0x00009888" value="0x084F1880" />
+        <register type="NOA" address="0x00009888" value="0x0A4F0011" />
+        <register type="NOA" address="0x00009888" value="0x0C4F0E3C" />
+        <register type="NOA" address="0x00009888" value="0x0E4F1D80" />
+        <register type="NOA" address="0x00009888" value="0x086C0002" />
+        <register type="NOA" address="0x00009888" value="0x0A6C0100" />
+        <register type="NOA" address="0x00009888" value="0x0E6C000C" />
+        <register type="NOA" address="0x00009888" value="0x026C000B" />
+        <register type="NOA" address="0x00009888" value="0x1C6C0000" />
+        <register type="NOA" address="0x00009888" value="0x1A6C0000" />
+        <register type="NOA" address="0x00009888" value="0x081B4000" />
+        <register type="NOA" address="0x00009888" value="0x0A1B8000" />
+        <register type="NOA" address="0x00009888" value="0x0E1B4000" />
+        <register type="NOA" address="0x00009888" value="0x021B4000" />
+        <register type="NOA" address="0x00009888" value="0x1A1C4000" />
+        <register type="NOA" address="0x00009888" value="0x1C1C0012" />
+        <register type="NOA" address="0x00009888" value="0x141C8000" />
+        <register type="NOA" address="0x00009888" value="0x005BC000" />
+        <register type="NOA" address="0x00009888" value="0x065B8000" />
+        <register type="NOA" address="0x00009888" value="0x085B8000" />
+        <register type="NOA" address="0x00009888" value="0x0A5B4000" />
+        <register type="NOA" address="0x00009888" value="0x0C5BC000" />
+        <register type="NOA" address="0x00009888" value="0x0E5B8000" />
+        <register type="NOA" address="0x00009888" value="0x105C8000" />
+        <register type="NOA" address="0x00009888" value="0x1A5CA000" />
+        <register type="NOA" address="0x00009888" value="0x1C5C002D" />
+        <register type="NOA" address="0x00009888" value="0x125C8000" />
+        <register type="NOA" address="0x00009888" value="0x0A4C0800" />
+        <register type="NOA" address="0x00009888" value="0x0C4C0082" />
+        <register type="NOA" address="0x00009888" value="0x084C8000" />
+        <register type="NOA" address="0x00009888" value="0x000DA000" />
+        <register type="NOA" address="0x00009888" value="0x060D8000" />
+        <register type="NOA" address="0x00009888" value="0x080DA000" />
+        <register type="NOA" address="0x00009888" value="0x0A0DA000" />
+        <register type="NOA" address="0x00009888" value="0x0C0DA000" />
+        <register type="NOA" address="0x00009888" value="0x0E0DA000" />
+        <register type="NOA" address="0x00009888" value="0x020D2000" />
+        <register type="NOA" address="0x00009888" value="0x0C0F5400" />
+        <register type="NOA" address="0x00009888" value="0x0E0F5500" />
+        <register type="NOA" address="0x00009888" value="0x100F0155" />
+        <register type="NOA" address="0x00009888" value="0x002CC000" />
+        <register type="NOA" address="0x00009888" value="0x0E2CC000" />
+        <register type="NOA" address="0x00009888" value="0x162CBE00" />
+        <register type="NOA" address="0x00009888" value="0x182C00EF" />
+        <register type="NOA" address="0x00009888" value="0x022CC000" />
+        <register type="NOA" address="0x00009888" value="0x042C8000" />
+        <register type="NOA" address="0x00009888" value="0x19900157" />
+        <register type="NOA" address="0x00009888" value="0x1B900167" />
+        <register type="NOA" address="0x00009888" value="0x1D900105" />
+        <register type="NOA" address="0x00009888" value="0x1F900103" />
+        <register type="NOA" address="0x00009888" value="0x35900000" />
+        <register type="NOA" address="0x00009888" value="0x11900FFF" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x41900840" />
+        <register type="NOA" address="0x00009888" value="0x55900000" />
+        <register type="NOA" address="0x00009888" value="0x45900842" />
+        <register type="NOA" address="0x00009888" value="0x47900840" />
+        <register type="NOA" address="0x00009888" value="0x57900000" />
+        <register type="NOA" address="0x00009888" value="0x49900840" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+        <register type="NOA" address="0x00009888" value="0x4B900040" />
+        <register type="NOA" address="0x00009888" value="0x59900000" />
+        <register type="NOA" address="0x00009888" value="0x43900840" />
+        <register type="NOA" address="0x00009888" value="0x53901111" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+    </register_config>
+    <register_config type="NOA"
+                     availability="$SliceMask 0x01 AND $SkuRevisionId 0x02 UGTE &amp;&amp;"
+                     priority="0"
+                     >
+        <register type="NOA" address="0x00009840" value="0x000000A0" />
+        <register type="NOA" address="0x00009888" value="0x104F00E0" />
+        <register type="NOA" address="0x00009888" value="0x124F1C00" />
+        <register type="NOA" address="0x00009888" value="0x106C00E0" />
+        <register type="NOA" address="0x00009888" value="0x37906800" />
+        <register type="NOA" address="0x00009888" value="0x3F901403" />
+        <register type="NOA" address="0x00009888" value="0x004E8000" />
+        <register type="NOA" address="0x00009888" value="0x1A4E0820" />
+        <register type="NOA" address="0x00009888" value="0x1C4E0002" />
+        <register type="NOA" address="0x00009888" value="0x064F0900" />
+        <register type="NOA" address="0x00009888" value="0x084F0032" />
+        <register type="NOA" address="0x00009888" value="0x0A4F1810" />
+        <register type="NOA" address="0x00009888" value="0x0C4F0E00" />
+        <register type="NOA" address="0x00009888" value="0x0E4F003C" />
+        <register type="NOA" address="0x00009888" value="0x004F0D80" />
+        <register type="NOA" address="0x00009888" value="0x024F003B" />
+        <register type="NOA" address="0x00009888" value="0x006C0002" />
+        <register type="NOA" address="0x00009888" value="0x086C0000" />
+        <register type="NOA" address="0x00009888" value="0x0C6C000C" />
+        <register type="NOA" address="0x00009888" value="0x0E6C0B00" />
+        <register type="NOA" address="0x00009888" value="0x186C0000" />
+        <register type="NOA" address="0x00009888" value="0x1C6C0000" />
+        <register type="NOA" address="0x00009888" value="0x1E6C0000" />
+        <register type="NOA" address="0x00009888" value="0x001B4000" />
+        <register type="NOA" address="0x00009888" value="0x081B8000" />
+        <register type="NOA" address="0x00009888" value="0x0C1B4000" />
+        <register type="NOA" address="0x00009888" value="0x0E1B8000" />
+        <register type="NOA" address="0x00009888" value="0x101C8000" />
+        <register type="NOA" address="0x00009888" value="0x1A1C8000" />
+        <register type="NOA" address="0x00009888" value="0x1C1C0024" />
+        <register type="NOA" address="0x00009888" value="0x065B8000" />
+        <register type="NOA" address="0x00009888" value="0x085B4000" />
+        <register type="NOA" address="0x00009888" value="0x0A5BC000" />
+        <register type="NOA" address="0x00009888" value="0x0C5B8000" />
+        <register type="NOA" address="0x00009888" value="0x0E5B4000" />
+        <register type="NOA" address="0x00009888" value="0x005B8000" />
+        <register type="NOA" address="0x00009888" value="0x025B4000" />
+        <register type="NOA" address="0x00009888" value="0x1A5C6000" />
+        <register type="NOA" address="0x00009888" value="0x1C5C001B" />
+        <register type="NOA" address="0x00009888" value="0x125C8000" />
+        <register type="NOA" address="0x00009888" value="0x145C8000" />
+        <register type="NOA" address="0x00009888" value="0x004C8000" />
+        <register type="NOA" address="0x00009888" value="0x0A4C2000" />
+        <register type="NOA" address="0x00009888" value="0x0C4C0208" />
+        <register type="NOA" address="0x00009888" value="0x000DA000" />
+        <register type="NOA" address="0x00009888" value="0x060D8000" />
+        <register type="NOA" address="0x00009888" value="0x080DA000" />
+        <register type="NOA" address="0x00009888" value="0x0A0DA000" />
+        <register type="NOA" address="0x00009888" value="0x0C0DA000" />
+        <register type="NOA" address="0x00009888" value="0x0E0DA000" />
+        <register type="NOA" address="0x00009888" value="0x020D2000" />
+        <register type="NOA" address="0x00009888" value="0x0C0F5400" />
+        <register type="NOA" address="0x00009888" value="0x0E0F5500" />
+        <register type="NOA" address="0x00009888" value="0x100F0155" />
+        <register type="NOA" address="0x00009888" value="0x002C8000" />
+        <register type="NOA" address="0x00009888" value="0x0E2CC000" />
+        <register type="NOA" address="0x00009888" value="0x162CFB00" />
+        <register type="NOA" address="0x00009888" value="0x182C00BE" />
+        <register type="NOA" address="0x00009888" value="0x022CC000" />
+        <register type="NOA" address="0x00009888" value="0x042CC000" />
+        <register type="NOA" address="0x00009888" value="0x19900157" />
+        <register type="NOA" address="0x00009888" value="0x1B900167" />
+        <register type="NOA" address="0x00009888" value="0x1D900105" />
+        <register type="NOA" address="0x00009888" value="0x1F900103" />
+        <register type="NOA" address="0x00009888" value="0x35900000" />
+        <register type="NOA" address="0x00009888" value="0x11900FFF" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x41900800" />
+        <register type="NOA" address="0x00009888" value="0x55900000" />
+        <register type="NOA" address="0x00009888" value="0x45900842" />
+        <register type="NOA" address="0x00009888" value="0x47900802" />
+        <register type="NOA" address="0x00009888" value="0x57900000" />
+        <register type="NOA" address="0x00009888" value="0x49900802" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+        <register type="NOA" address="0x00009888" value="0x4B900002" />
+        <register type="NOA" address="0x00009888" value="0x59900000" />
+        <register type="NOA" address="0x00009888" value="0x43900842" />
+        <register type="NOA" address="0x00009888" value="0x53901111" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x00800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+        <register type="OA" address="0x00002740" value="0x00000000" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00000003" />
+        <register type="FLEX" address="0x0000E658" value="0x00002001" />
+        <register type="FLEX" address="0x0000E758" value="0x00778008" />
+        <register type="FLEX" address="0x0000E45C" value="0x00088078" />
+        <register type="FLEX" address="0x0000E55C" value="0x00808708" />
+        <register type="FLEX" address="0x0000E65C" value="0x00A08908" />
+    </register_config>
+  </set>
+
+  <set name="Render Metrics for 3D Pipeline Profile Gen9"
+       mdapi_supported_apis="VK OGL OCL IO BB"
+       underscore_name="render_pipe_profile"
+       hw_config_guid="2a0c0933-37e7-427c-9951-ded42a78bb27"
+       chipset="SKLGT2"
+       symbol_name="RenderPipeProfile"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Bottleneck"
+             low_watermark="10"
+             description="The percentage of time in which vertex shader pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="30"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_bottleneck"
+             units="percent"
+             symbol_name="VsBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Hi-Depth Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which early hierarchical depth test pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="15"
+             equation="C 6 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="hi_depth_bottleneck"
+             units="percent"
+             symbol_name="HiDepthBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which geometry shader pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="15"
+             equation="B 3 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gs_bottleneck"
+             units="percent"
+             symbol_name="GsBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Geometry Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="BC Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which barycentric coordinates calculation pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="15"
+             equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="bc_bottleneck"
+             units="percent"
+             symbol_name="BcBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Rasterizer/Barycentric Calc"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="HS Stall"
+             description="The percentage of time in which hull shader pipeline stage was stalled."
+             data_type="float"
+             equation="C 1 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="hs_stall"
+             units="percent"
+             symbol_name="HsStall"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier4 Correlate Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Hull Shader"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texel lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="VF Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which vertex fetch pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="15"
+             equation="C 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vf_bottleneck"
+             units="percent"
+             symbol_name="VfBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Input Assembler"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Strip-Fans Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which strip-fans pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="10"
+             equation="B 6 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sf_bottleneck"
+             units="percent"
+             symbol_name="SfBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Rasterizer/Strip-Fans"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SF Stall"
+             description="The percentage of time in which strip-fans pipeline stage was stalled."
+             data_type="float"
+             equation="C 5 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sf_stall"
+             units="percent"
+             symbol_name="SfStall"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Correlate Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Strip-Fans"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="HS Bottleneck"
+             low_watermark="3"
+             description="The percentage of time in which hull shader pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="9"
+             equation="B 1 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="hs_bottleneck"
+             units="percent"
+             symbol_name="HsBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Hull Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="CL Stall"
+             description="The percentage of time in which clipper pipeline stage was stalled."
+             data_type="float"
+             equation="C 4 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="cl_stall"
+             units="percent"
+             symbol_name="ClStall"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Correlate Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Clipper"
+             />
+    <counter name="SO Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which stream output pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="15"
+             equation="B 4 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="so_bottleneck"
+             units="percent"
+             symbol_name="SoBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Stream Output"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="DS Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which domain shader pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="15"
+             equation="B 2 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ds_bottleneck"
+             units="percent"
+             symbol_name="DsBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Domain Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Clipper Bottleneck"
+             low_watermark="10"
+             description="The percentage of time in which clipper pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="30"
+             equation="B 5 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="cl_bottleneck"
+             units="percent"
+             symbol_name="ClBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Clipper"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Stall"
+             description="The percentage of time in which domain shader pipeline stage was stalled."
+             data_type="float"
+             equation="C 2 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ds_stall"
+             units="percent"
+             symbol_name="DsStall"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier4 Correlate Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Domain Shader"
+             />
+    <counter name="Early Depth Bottleneck"
+             low_watermark="10"
+             description="The percentage of time in which early depth test pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="30"
+             equation="B 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="early_depth_bottleneck"
+             units="percent"
+             symbol_name="EarlyDepthBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="SO Stall"
+             description="The percentage of time in which stream-output pipeline stage was stalled."
+             data_type="float"
+             equation="C 3 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="so_stall"
+             units="percent"
+             symbol_name="SoStall"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Correlate Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Stream Output"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA"
+                     availability="$SkuRevisionId 0x02 ULT"
+                     priority="0"
+                     >
+        <register type="NOA" address="0x00009840" value="0x000000A0" />
+        <register type="NOA" address="0x00009888" value="0x0C0E001F" />
+        <register type="NOA" address="0x00009888" value="0x0A0F0000" />
+        <register type="NOA" address="0x00009888" value="0x10116800" />
+        <register type="NOA" address="0x00009888" value="0x178A03E0" />
+        <register type="NOA" address="0x00009888" value="0x11824C00" />
+        <register type="NOA" address="0x00009888" value="0x11830020" />
+        <register type="NOA" address="0x00009888" value="0x13840020" />
+        <register type="NOA" address="0x00009888" value="0x11850019" />
+        <register type="NOA" address="0x00009888" value="0x11860007" />
+        <register type="NOA" address="0x00009888" value="0x01870C40" />
+        <register type="NOA" address="0x00009888" value="0x17880000" />
+        <register type="NOA" address="0x00009888" value="0x022F4000" />
+        <register type="NOA" address="0x00009888" value="0x0A4C0040" />
+        <register type="NOA" address="0x00009888" value="0x0C0D8000" />
+        <register type="NOA" address="0x00009888" value="0x040D4000" />
+        <register type="NOA" address="0x00009888" value="0x060D2000" />
+        <register type="NOA" address="0x00009888" value="0x020E5400" />
+        <register type="NOA" address="0x00009888" value="0x000E0000" />
+        <register type="NOA" address="0x00009888" value="0x080F0040" />
+        <register type="NOA" address="0x00009888" value="0x000F0000" />
+        <register type="NOA" address="0x00009888" value="0x100F0000" />
+        <register type="NOA" address="0x00009888" value="0x0E0F0040" />
+        <register type="NOA" address="0x00009888" value="0x0C2C8000" />
+        <register type="NOA" address="0x00009888" value="0x06104000" />
+        <register type="NOA" address="0x00009888" value="0x06110012" />
+        <register type="NOA" address="0x00009888" value="0x06131000" />
+        <register type="NOA" address="0x00009888" value="0x01898000" />
+        <register type="NOA" address="0x00009888" value="0x0D890100" />
+        <register type="NOA" address="0x00009888" value="0x03898000" />
+        <register type="NOA" address="0x00009888" value="0x09808000" />
+        <register type="NOA" address="0x00009888" value="0x0B808000" />
+        <register type="NOA" address="0x00009888" value="0x0380C000" />
+        <register type="NOA" address="0x00009888" value="0x0F8A0075" />
+        <register type="NOA" address="0x00009888" value="0x1D8A0000" />
+        <register type="NOA" address="0x00009888" value="0x118A8000" />
+        <register type="NOA" address="0x00009888" value="0x1B8A4000" />
+        <register type="NOA" address="0x00009888" value="0x138A8000" />
+        <register type="NOA" address="0x00009888" value="0x1D81A000" />
+        <register type="NOA" address="0x00009888" value="0x15818000" />
+        <register type="NOA" address="0x00009888" value="0x17818000" />
+        <register type="NOA" address="0x00009888" value="0x0B820030" />
+        <register type="NOA" address="0x00009888" value="0x07828000" />
+        <register type="NOA" address="0x00009888" value="0x0D824000" />
+        <register type="NOA" address="0x00009888" value="0x0F828000" />
+        <register type="NOA" address="0x00009888" value="0x05824000" />
+        <register type="NOA" address="0x00009888" value="0x0D830003" />
+        <register type="NOA" address="0x00009888" value="0x0583000C" />
+        <register type="NOA" address="0x00009888" value="0x09830000" />
+        <register type="NOA" address="0x00009888" value="0x03838000" />
+        <register type="NOA" address="0x00009888" value="0x07838000" />
+        <register type="NOA" address="0x00009888" value="0x0B840980" />
+        <register type="NOA" address="0x00009888" value="0x03844D80" />
+        <register type="NOA" address="0x00009888" value="0x11840000" />
+        <register type="NOA" address="0x00009888" value="0x09848000" />
+        <register type="NOA" address="0x00009888" value="0x09850080" />
+        <register type="NOA" address="0x00009888" value="0x03850003" />
+        <register type="NOA" address="0x00009888" value="0x01850000" />
+        <register type="NOA" address="0x00009888" value="0x07860000" />
+        <register type="NOA" address="0x00009888" value="0x0F860400" />
+        <register type="NOA" address="0x00009888" value="0x09870032" />
+        <register type="NOA" address="0x00009888" value="0x01888052" />
+        <register type="NOA" address="0x00009888" value="0x11880000" />
+        <register type="NOA" address="0x00009888" value="0x09884000" />
+        <register type="NOA" address="0x00009888" value="0x15968000" />
+        <register type="NOA" address="0x00009888" value="0x17968000" />
+        <register type="NOA" address="0x00009888" value="0x0F96C000" />
+        <register type="NOA" address="0x00009888" value="0x1F950011" />
+        <register type="NOA" address="0x00009888" value="0x1D950014" />
+        <register type="NOA" address="0x00009888" value="0x0592C000" />
+        <register type="NOA" address="0x00009888" value="0x0B928000" />
+        <register type="NOA" address="0x00009888" value="0x0D924000" />
+        <register type="NOA" address="0x00009888" value="0x0F924000" />
+        <register type="NOA" address="0x00009888" value="0x11928000" />
+        <register type="NOA" address="0x00009888" value="0x1392C000" />
+        <register type="NOA" address="0x00009888" value="0x09924000" />
+        <register type="NOA" address="0x00009888" value="0x01985000" />
+        <register type="NOA" address="0x00009888" value="0x07988000" />
+        <register type="NOA" address="0x00009888" value="0x09981000" />
+        <register type="NOA" address="0x00009888" value="0x0B982000" />
+        <register type="NOA" address="0x00009888" value="0x0D982000" />
+        <register type="NOA" address="0x00009888" value="0x0F989000" />
+        <register type="NOA" address="0x00009888" value="0x05982000" />
+        <register type="NOA" address="0x00009888" value="0x13904000" />
+        <register type="NOA" address="0x00009888" value="0x21904000" />
+        <register type="NOA" address="0x00009888" value="0x23904000" />
+        <register type="NOA" address="0x00009888" value="0x25908000" />
+        <register type="NOA" address="0x00009888" value="0x27904000" />
+        <register type="NOA" address="0x00009888" value="0x29908000" />
+        <register type="NOA" address="0x00009888" value="0x2B904000" />
+        <register type="NOA" address="0x00009888" value="0x2F904000" />
+        <register type="NOA" address="0x00009888" value="0x31904000" />
+        <register type="NOA" address="0x00009888" value="0x15904000" />
+        <register type="NOA" address="0x00009888" value="0x17908000" />
+        <register type="NOA" address="0x00009888" value="0x19908000" />
+        <register type="NOA" address="0x00009888" value="0x1B904000" />
+        <register type="NOA" address="0x00009888" value="0x0B978000" />
+        <register type="NOA" address="0x00009888" value="0x0F974000" />
+        <register type="NOA" address="0x00009888" value="0x11974000" />
+        <register type="NOA" address="0x00009888" value="0x13978000" />
+        <register type="NOA" address="0x00009888" value="0x09974000" />
+        <register type="NOA" address="0x00009888" value="0x1190C080" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x419010A0" />
+        <register type="NOA" address="0x00009888" value="0x55904000" />
+        <register type="NOA" address="0x00009888" value="0x45901000" />
+        <register type="NOA" address="0x00009888" value="0x47900084" />
+        <register type="NOA" address="0x00009888" value="0x57904400" />
+        <register type="NOA" address="0x00009888" value="0x499000A5" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+        <register type="NOA" address="0x00009888" value="0x4B900081" />
+        <register type="NOA" address="0x00009888" value="0x59900000" />
+        <register type="NOA" address="0x00009888" value="0x439014A4" />
+        <register type="NOA" address="0x00009888" value="0x53900400" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+    </register_config>
+    <register_config type="NOA"
+                     availability="$SkuRevisionId 0x02 UGTE"
+                     priority="0"
+                     >
+        <register type="NOA" address="0x00009840" value="0x000000A0" />
+        <register type="NOA" address="0x00009888" value="0x0C0E001F" />
+        <register type="NOA" address="0x00009888" value="0x0A0F0000" />
+        <register type="NOA" address="0x00009888" value="0x10116800" />
+        <register type="NOA" address="0x00009888" value="0x178A03E0" />
+        <register type="NOA" address="0x00009888" value="0x11824C00" />
+        <register type="NOA" address="0x00009888" value="0x11830020" />
+        <register type="NOA" address="0x00009888" value="0x13840020" />
+        <register type="NOA" address="0x00009888" value="0x11850019" />
+        <register type="NOA" address="0x00009888" value="0x11860007" />
+        <register type="NOA" address="0x00009888" value="0x01870C40" />
+        <register type="NOA" address="0x00009888" value="0x17880000" />
+        <register type="NOA" address="0x00009888" value="0x022F4000" />
+        <register type="NOA" address="0x00009888" value="0x0A4C0040" />
+        <register type="NOA" address="0x00009888" value="0x0C0D8000" />
+        <register type="NOA" address="0x00009888" value="0x040D4000" />
+        <register type="NOA" address="0x00009888" value="0x060D2000" />
+        <register type="NOA" address="0x00009888" value="0x020E5400" />
+        <register type="NOA" address="0x00009888" value="0x000E0000" />
+        <register type="NOA" address="0x00009888" value="0x080F0040" />
+        <register type="NOA" address="0x00009888" value="0x000F0000" />
+        <register type="NOA" address="0x00009888" value="0x100F0000" />
+        <register type="NOA" address="0x00009888" value="0x0E0F0040" />
+        <register type="NOA" address="0x00009888" value="0x0C2C8000" />
+        <register type="NOA" address="0x00009888" value="0x06104000" />
+        <register type="NOA" address="0x00009888" value="0x06110012" />
+        <register type="NOA" address="0x00009888" value="0x06131000" />
+        <register type="NOA" address="0x00009888" value="0x01898000" />
+        <register type="NOA" address="0x00009888" value="0x0D890100" />
+        <register type="NOA" address="0x00009888" value="0x03898000" />
+        <register type="NOA" address="0x00009888" value="0x09808000" />
+        <register type="NOA" address="0x00009888" value="0x0B808000" />
+        <register type="NOA" address="0x00009888" value="0x0380C000" />
+        <register type="NOA" address="0x00009888" value="0x0F8A0075" />
+        <register type="NOA" address="0x00009888" value="0x1D8A0000" />
+        <register type="NOA" address="0x00009888" value="0x118A8000" />
+        <register type="NOA" address="0x00009888" value="0x1B8A4000" />
+        <register type="NOA" address="0x00009888" value="0x138A8000" />
+        <register type="NOA" address="0x00009888" value="0x1D81A000" />
+        <register type="NOA" address="0x00009888" value="0x15818000" />
+        <register type="NOA" address="0x00009888" value="0x17818000" />
+        <register type="NOA" address="0x00009888" value="0x0B820030" />
+        <register type="NOA" address="0x00009888" value="0x07828000" />
+        <register type="NOA" address="0x00009888" value="0x0D824000" />
+        <register type="NOA" address="0x00009888" value="0x0F828000" />
+        <register type="NOA" address="0x00009888" value="0x05824000" />
+        <register type="NOA" address="0x00009888" value="0x0D830003" />
+        <register type="NOA" address="0x00009888" value="0x0583000C" />
+        <register type="NOA" address="0x00009888" value="0x09830000" />
+        <register type="NOA" address="0x00009888" value="0x03838000" />
+        <register type="NOA" address="0x00009888" value="0x07838000" />
+        <register type="NOA" address="0x00009888" value="0x0B840980" />
+        <register type="NOA" address="0x00009888" value="0x03844D80" />
+        <register type="NOA" address="0x00009888" value="0x11840000" />
+        <register type="NOA" address="0x00009888" value="0x09848000" />
+        <register type="NOA" address="0x00009888" value="0x09850080" />
+        <register type="NOA" address="0x00009888" value="0x03850003" />
+        <register type="NOA" address="0x00009888" value="0x01850000" />
+        <register type="NOA" address="0x00009888" value="0x07860000" />
+        <register type="NOA" address="0x00009888" value="0x0F860400" />
+        <register type="NOA" address="0x00009888" value="0x09870032" />
+        <register type="NOA" address="0x00009888" value="0x01888052" />
+        <register type="NOA" address="0x00009888" value="0x11880000" />
+        <register type="NOA" address="0x00009888" value="0x09884000" />
+        <register type="NOA" address="0x00009888" value="0x1B931001" />
+        <register type="NOA" address="0x00009888" value="0x1D930001" />
+        <register type="NOA" address="0x00009888" value="0x19934000" />
+        <register type="NOA" address="0x00009888" value="0x1B958000" />
+        <register type="NOA" address="0x00009888" value="0x1D950094" />
+        <register type="NOA" address="0x00009888" value="0x19958000" />
+        <register type="NOA" address="0x00009888" value="0x05E5A000" />
+        <register type="NOA" address="0x00009888" value="0x01E5C000" />
+        <register type="NOA" address="0x00009888" value="0x0592C000" />
+        <register type="NOA" address="0x00009888" value="0x0B928000" />
+        <register type="NOA" address="0x00009888" value="0x0D924000" />
+        <register type="NOA" address="0x00009888" value="0x0F924000" />
+        <register type="NOA" address="0x00009888" value="0x11928000" />
+        <register type="NOA" address="0x00009888" value="0x1392C000" />
+        <register type="NOA" address="0x00009888" value="0x09924000" />
+        <register type="NOA" address="0x00009888" value="0x01985000" />
+        <register type="NOA" address="0x00009888" value="0x07988000" />
+        <register type="NOA" address="0x00009888" value="0x09981000" />
+        <register type="NOA" address="0x00009888" value="0x0B982000" />
+        <register type="NOA" address="0x00009888" value="0x0D982000" />
+        <register type="NOA" address="0x00009888" value="0x0F989000" />
+        <register type="NOA" address="0x00009888" value="0x05982000" />
+        <register type="NOA" address="0x00009888" value="0x13904000" />
+        <register type="NOA" address="0x00009888" value="0x21904000" />
+        <register type="NOA" address="0x00009888" value="0x23904000" />
+        <register type="NOA" address="0x00009888" value="0x25908000" />
+        <register type="NOA" address="0x00009888" value="0x27904000" />
+        <register type="NOA" address="0x00009888" value="0x29908000" />
+        <register type="NOA" address="0x00009888" value="0x2B904000" />
+        <register type="NOA" address="0x00009888" value="0x2F904000" />
+        <register type="NOA" address="0x00009888" value="0x31904000" />
+        <register type="NOA" address="0x00009888" value="0x15904000" />
+        <register type="NOA" address="0x00009888" value="0x17908000" />
+        <register type="NOA" address="0x00009888" value="0x19908000" />
+        <register type="NOA" address="0x00009888" value="0x1B904000" />
+        <register type="NOA" address="0x00009888" value="0x1190C080" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x419010A0" />
+        <register type="NOA" address="0x00009888" value="0x55904000" />
+        <register type="NOA" address="0x00009888" value="0x45901000" />
+        <register type="NOA" address="0x00009888" value="0x47900084" />
+        <register type="NOA" address="0x00009888" value="0x57904400" />
+        <register type="NOA" address="0x00009888" value="0x499000A5" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+        <register type="NOA" address="0x00009888" value="0x4B900081" />
+        <register type="NOA" address="0x00009888" value="0x59900000" />
+        <register type="NOA" address="0x00009888" value="0x439014A4" />
+        <register type="NOA" address="0x00009888" value="0x53900400" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002724" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002770" value="0x0007FFEA" />
+        <register type="OA" address="0x00002774" value="0x00007FFC" />
+        <register type="OA" address="0x00002778" value="0x0007AFFA" />
+        <register type="OA" address="0x0000277C" value="0x0000F5FD" />
+        <register type="OA" address="0x00002780" value="0x00079FFA" />
+        <register type="OA" address="0x00002784" value="0x0000F3FB" />
+        <register type="OA" address="0x00002788" value="0x0007BF7A" />
+        <register type="OA" address="0x0000278C" value="0x0000F7E7" />
+        <register type="OA" address="0x00002790" value="0x0007FEFA" />
+        <register type="OA" address="0x00002794" value="0x0000F7CF" />
+        <register type="OA" address="0x00002798" value="0x00077FFA" />
+        <register type="OA" address="0x0000279C" value="0x0000EFDF" />
+        <register type="OA" address="0x000027A0" value="0x0006FFFA" />
+        <register type="OA" address="0x000027A4" value="0x0000CFBF" />
+        <register type="OA" address="0x000027A8" value="0x0003FFFA" />
+        <register type="OA" address="0x000027AC" value="0x00005F7F" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00015014" />
+        <register type="FLEX" address="0x0000E658" value="0x00025024" />
+        <register type="FLEX" address="0x0000E758" value="0x00035034" />
+        <register type="FLEX" address="0x0000E45C" value="0x00045044" />
+        <register type="FLEX" address="0x0000E55C" value="0x00055054" />
+        <register type="FLEX" address="0x0000E65C" value="0x00065064" />
+    </register_config>
+  </set>
+
+  <set name="Memory Reads Distribution Gen9"
+       mdapi_supported_apis="VK OGL OCL IO BB"
+       underscore_name="memory_reads"
+       hw_config_guid="246b35f1-44e0-4d03-8936-e452e291d064"
+       chipset="SKLGT2"
+       symbol_name="MemoryReads"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GtiL3Bank0Reads"
+             description="The total number of GTI memory reads from L3 Bank 0 (L3 Cache misses)."
+             data_type="uint64"
+             equation="C 4 READ"
+             underscore_name="gti_l3_bank0_reads"
+             units="messages"
+             symbol_name="GtiL3Bank0Reads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/L3"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="GtiRingAccesses"
+             description="The total number of all accesses from GTI to the ring."
+             data_type="uint64"
+             equation="C 3 READ 2 UMUL"
+             underscore_name="gti_ring_accesses"
+             units="messages"
+             symbol_name="GtiRingAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="GtiL3Bank3Reads"
+             description="The total number of GTI memory reads from L3 Bank 3 (L3 Cache misses)."
+             data_type="uint64"
+             equation="C 7 READ"
+             underscore_name="gti_l3_bank3_reads"
+             units="messages"
+             symbol_name="GtiL3Bank3Reads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="GTI/L3"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="GtiRsMemoryReads"
+             description="The total number of GTI memory reads from Resource Streamer."
+             data_type="uint64"
+             equation="B 2 READ"
+             underscore_name="gti_rs_memory_reads"
+             units="messages"
+             symbol_name="GtiRsMemoryReads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/3D Pipe/Resource Streamer"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GtiHizMemoryReads"
+             description="The total number of GTI memory reads from Hierarchical Depth Cache (Hi-Depth Cache misses)."
+             data_type="uint64"
+             equation="B 5 READ"
+             underscore_name="gti_hiz_memory_reads"
+             units="messages"
+             symbol_name="GtiHizMemoryReads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Depth Cache"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="GtiRccMemoryReads"
+             description="The total number of GTI memory reads from Render Color Cache (Render Color Cache misses)."
+             data_type="uint64"
+             equation="B 3 READ"
+             underscore_name="gti_rcc_memory_reads"
+             units="messages"
+             symbol_name="GtiRccMemoryReads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Color Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GtiL3Bank1Reads"
+             description="The total number of GTI memory reads from L3 Bank 1 (L3 Cache misses)."
+             data_type="uint64"
+             equation="C 5 READ"
+             underscore_name="gti_l3_bank1_reads"
+             units="messages"
+             symbol_name="GtiL3Bank1Reads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="GTI/L3"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GtiCmdStreamerMemoryReads"
+             description="The total number of GTI memory reads from Command Streamer."
+             data_type="uint64"
+             equation="B 0 READ"
+             underscore_name="gti_cmd_streamer_memory_reads"
+             units="messages"
+             symbol_name="GtiCmdStreamerMemoryReads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/3D Pipe/Command Streamer"
+             />
+    <counter name="GtiL3Bank2Reads"
+             description="The total number of GTI memory reads from L3 Bank 2 (L3 Cache misses)."
+             data_type="uint64"
+             equation="C 6 READ"
+             underscore_name="gti_l3_bank2_reads"
+             units="messages"
+             symbol_name="GtiL3Bank2Reads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="GTI/L3"
+             />
+    <counter name="GtiMemoryReads"
+             description="The total number of GTI memory reads."
+             data_type="uint64"
+             equation="C 0 READ"
+             underscore_name="gti_memory_reads"
+             units="messages"
+             symbol_name="GtiMemoryReads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="GtiRczMemoryReads"
+             description="The total number of GTI memory reads from Render Depth Cache (Render Depth Cache misses)."
+             data_type="uint64"
+             equation="B 7 READ"
+             underscore_name="gti_rcz_memory_reads"
+             units="messages"
+             symbol_name="GtiRczMemoryReads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Depth Cache"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="GtiMscMemoryReads"
+             description="The total number of GTI memory reads from Multisampling Color Cache (Multisampling Color Cache misses)."
+             data_type="uint64"
+             equation="B 4 READ"
+             underscore_name="gti_msc_memory_reads"
+             units="messages"
+             symbol_name="GtiMscMemoryReads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Color Cache"
+             />
+    <counter name="GtiVfMemoryReads"
+             description="The total number of GTI memory reads from Vertex Fetch."
+             data_type="uint64"
+             equation="B 1 READ"
+             underscore_name="gti_vf_memory_reads"
+             units="messages"
+             symbol_name="GtiVfMemoryReads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/3D Pipe/Vertex Fetch"
+             />
+    <counter name="GtiStcMemoryReads"
+             description="The total number of GTI memory reads from Stencil Cache (Stencil Cache misses)."
+             data_type="uint64"
+             equation="B 6 READ"
+             underscore_name="gti_stc_memory_reads"
+             units="messages"
+             symbol_name="GtiStcMemoryReads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Depth Cache"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GtiL3Reads"
+             description="The total number of GTI memory reads from L3 (L3 Cache misses)."
+             data_type="uint64"
+             equation="$GtiL3Bank0Reads $GtiL3Bank1Reads $GtiL3Bank2Reads $GtiL3Bank3Reads UADD UADD UADD"
+             underscore_name="gti_l3_reads"
+             units="messages"
+             symbol_name="GtiL3Reads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/L3"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA"
+                     availability="$SliceMask 0x01 AND $SkuRevisionId 0x02 ULT &amp;&amp;"
+                     priority="0"
+                     >
+        <register type="NOA" address="0x00009840" value="0x000000A0" />
+        <register type="NOA" address="0x00009888" value="0x11810C00" />
+        <register type="NOA" address="0x00009888" value="0x1381001A" />
+        <register type="NOA" address="0x00009888" value="0x13946000" />
+        <register type="NOA" address="0x00009888" value="0x37906800" />
+        <register type="NOA" address="0x00009888" value="0x3F900003" />
+        <register type="NOA" address="0x00009888" value="0x03811300" />
+        <register type="NOA" address="0x00009888" value="0x05811B12" />
+        <register type="NOA" address="0x00009888" value="0x0781001A" />
+        <register type="NOA" address="0x00009888" value="0x1F810000" />
+        <register type="NOA" address="0x00009888" value="0x17810000" />
+        <register type="NOA" address="0x00009888" value="0x19810000" />
+        <register type="NOA" address="0x00009888" value="0x1B810000" />
+        <register type="NOA" address="0x00009888" value="0x1D810000" />
+        <register type="NOA" address="0x00009888" value="0x0F968000" />
+        <register type="NOA" address="0x00009888" value="0x1196C000" />
+        <register type="NOA" address="0x00009888" value="0x13964000" />
+        <register type="NOA" address="0x00009888" value="0x11938000" />
+        <register type="NOA" address="0x00009888" value="0x1B93FE00" />
+        <register type="NOA" address="0x00009888" value="0x01940010" />
+        <register type="NOA" address="0x00009888" value="0x07941100" />
+        <register type="NOA" address="0x00009888" value="0x09941312" />
+        <register type="NOA" address="0x00009888" value="0x0B941514" />
+        <register type="NOA" address="0x00009888" value="0x0D941716" />
+        <register type="NOA" address="0x00009888" value="0x11940000" />
+        <register type="NOA" address="0x00009888" value="0x19940000" />
+        <register type="NOA" address="0x00009888" value="0x1B940000" />
+        <register type="NOA" address="0x00009888" value="0x1D940000" />
+        <register type="NOA" address="0x00009888" value="0x1B954000" />
+        <register type="NOA" address="0x00009888" value="0x1D95A550" />
+        <register type="NOA" address="0x00009888" value="0x1F9502AA" />
+        <register type="NOA" address="0x00009888" value="0x2F900157" />
+        <register type="NOA" address="0x00009888" value="0x31900105" />
+        <register type="NOA" address="0x00009888" value="0x15900103" />
+        <register type="NOA" address="0x00009888" value="0x17900101" />
+        <register type="NOA" address="0x00009888" value="0x35900000" />
+        <register type="NOA" address="0x00009888" value="0x13908000" />
+        <register type="NOA" address="0x00009888" value="0x21908000" />
+        <register type="NOA" address="0x00009888" value="0x23908000" />
+        <register type="NOA" address="0x00009888" value="0x25908000" />
+        <register type="NOA" address="0x00009888" value="0x27908000" />
+        <register type="NOA" address="0x00009888" value="0x29908000" />
+        <register type="NOA" address="0x00009888" value="0x2B908000" />
+        <register type="NOA" address="0x00009888" value="0x2D908000" />
+        <register type="NOA" address="0x00009888" value="0x19908000" />
+        <register type="NOA" address="0x00009888" value="0x1B908000" />
+        <register type="NOA" address="0x00009888" value="0x1D908000" />
+        <register type="NOA" address="0x00009888" value="0x1F908000" />
+        <register type="NOA" address="0x00009888" value="0x11900000" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x41900C00" />
+        <register type="NOA" address="0x00009888" value="0x55900000" />
+        <register type="NOA" address="0x00009888" value="0x45900000" />
+        <register type="NOA" address="0x00009888" value="0x47900000" />
+        <register type="NOA" address="0x00009888" value="0x57900000" />
+        <register type="NOA" address="0x00009888" value="0x49900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+        <register type="NOA" address="0x00009888" value="0x4B900063" />
+        <register type="NOA" address="0x00009888" value="0x59900000" />
+        <register type="NOA" address="0x00009888" value="0x43900003" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+    </register_config>
+    <register_config type="NOA"
+                     availability="$SkuRevisionId 0x05 ULT $SkuRevisionId 0x02 UGTE &amp;&amp;"
+                     priority="0"
+                     >
+        <register type="NOA" address="0x00009840" value="0x000000A0" />
+        <register type="NOA" address="0x00009888" value="0x11810C00" />
+        <register type="NOA" address="0x00009888" value="0x1381001A" />
+        <register type="NOA" address="0x00009888" value="0x13946000" />
+        <register type="NOA" address="0x00009888" value="0x15940016" />
+        <register type="NOA" address="0x00009888" value="0x37906800" />
+        <register type="NOA" address="0x00009888" value="0x03811300" />
+        <register type="NOA" address="0x00009888" value="0x05811B12" />
+        <register type="NOA" address="0x00009888" value="0x0781001A" />
+        <register type="NOA" address="0x00009888" value="0x1F810000" />
+        <register type="NOA" address="0x00009888" value="0x17810000" />
+        <register type="NOA" address="0x00009888" value="0x19810000" />
+        <register type="NOA" address="0x00009888" value="0x1B810000" />
+        <register type="NOA" address="0x00009888" value="0x1D810000" />
+        <register type="NOA" address="0x00009888" value="0x19930800" />
+        <register type="NOA" address="0x00009888" value="0x1B93AA55" />
+        <register type="NOA" address="0x00009888" value="0x1D9300AA" />
+        <register type="NOA" address="0x00009888" value="0x01940010" />
+        <register type="NOA" address="0x00009888" value="0x07941100" />
+        <register type="NOA" address="0x00009888" value="0x09941312" />
+        <register type="NOA" address="0x00009888" value="0x0B941514" />
+        <register type="NOA" address="0x00009888" value="0x0D941716" />
+        <register type="NOA" address="0x00009888" value="0x0F940018" />
+        <register type="NOA" address="0x00009888" value="0x1B940000" />
+        <register type="NOA" address="0x00009888" value="0x11940000" />
+        <register type="NOA" address="0x00009888" value="0x01E58000" />
+        <register type="NOA" address="0x00009888" value="0x03E57000" />
+        <register type="NOA" address="0x00009888" value="0x31900105" />
+        <register type="NOA" address="0x00009888" value="0x15900103" />
+        <register type="NOA" address="0x00009888" value="0x17900101" />
+        <register type="NOA" address="0x00009888" value="0x35900000" />
+        <register type="NOA" address="0x00009888" value="0x13908000" />
+        <register type="NOA" address="0x00009888" value="0x21908000" />
+        <register type="NOA" address="0x00009888" value="0x23908000" />
+        <register type="NOA" address="0x00009888" value="0x25908000" />
+        <register type="NOA" address="0x00009888" value="0x27908000" />
+        <register type="NOA" address="0x00009888" value="0x29908000" />
+        <register type="NOA" address="0x00009888" value="0x2B908000" />
+        <register type="NOA" address="0x00009888" value="0x2D908000" />
+        <register type="NOA" address="0x00009888" value="0x2F908000" />
+        <register type="NOA" address="0x00009888" value="0x19908000" />
+        <register type="NOA" address="0x00009888" value="0x1B908000" />
+        <register type="NOA" address="0x00009888" value="0x1D908000" />
+        <register type="NOA" address="0x00009888" value="0x1F908000" />
+        <register type="NOA" address="0x00009888" value="0x11900000" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x41900C20" />
+        <register type="NOA" address="0x00009888" value="0x55900000" />
+        <register type="NOA" address="0x00009888" value="0x45900400" />
+        <register type="NOA" address="0x00009888" value="0x47900421" />
+        <register type="NOA" address="0x00009888" value="0x57900000" />
+        <register type="NOA" address="0x00009888" value="0x49900421" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+        <register type="NOA" address="0x00009888" value="0x4B900061" />
+        <register type="NOA" address="0x00009888" value="0x59900000" />
+        <register type="NOA" address="0x00009888" value="0x43900003" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+    </register_config>
+    <register_config type="NOA"
+                     availability="$SkuRevisionId 0x05 UGTE"
+                     priority="0"
+                     >
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x11810C00" />
+        <register type="NOA" address="0x00009888" value="0x1381001A" />
+        <register type="NOA" address="0x00009888" value="0x37906800" />
+        <register type="NOA" address="0x00009888" value="0x3F900064" />
+        <register type="NOA" address="0x00009888" value="0x03811300" />
+        <register type="NOA" address="0x00009888" value="0x05811B12" />
+        <register type="NOA" address="0x00009888" value="0x0781001A" />
+        <register type="NOA" address="0x00009888" value="0x1F810000" />
+        <register type="NOA" address="0x00009888" value="0x17810000" />
+        <register type="NOA" address="0x00009888" value="0x19810000" />
+        <register type="NOA" address="0x00009888" value="0x1B810000" />
+        <register type="NOA" address="0x00009888" value="0x1D810000" />
+        <register type="NOA" address="0x00009888" value="0x1B930055" />
+        <register type="NOA" address="0x00009888" value="0x03E58000" />
+        <register type="NOA" address="0x00009888" value="0x05E5C000" />
+        <register type="NOA" address="0x00009888" value="0x07E54000" />
+        <register type="NOA" address="0x00009888" value="0x13900150" />
+        <register type="NOA" address="0x00009888" value="0x21900151" />
+        <register type="NOA" address="0x00009888" value="0x23900152" />
+        <register type="NOA" address="0x00009888" value="0x25900153" />
+        <register type="NOA" address="0x00009888" value="0x27900154" />
+        <register type="NOA" address="0x00009888" value="0x29900155" />
+        <register type="NOA" address="0x00009888" value="0x2B900156" />
+        <register type="NOA" address="0x00009888" value="0x2D900157" />
+        <register type="NOA" address="0x00009888" value="0x2F90015F" />
+        <register type="NOA" address="0x00009888" value="0x31900105" />
+        <register type="NOA" address="0x00009888" value="0x15900103" />
+        <register type="NOA" address="0x00009888" value="0x17900101" />
+        <register type="NOA" address="0x00009888" value="0x35900000" />
+        <register type="NOA" address="0x00009888" value="0x19908000" />
+        <register type="NOA" address="0x00009888" value="0x1B908000" />
+        <register type="NOA" address="0x00009888" value="0x1D908000" />
+        <register type="NOA" address="0x00009888" value="0x1F908000" />
+        <register type="NOA" address="0x00009888" value="0x11900000" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x41900C60" />
+        <register type="NOA" address="0x00009888" value="0x55900000" />
+        <register type="NOA" address="0x00009888" value="0x45900C00" />
+        <register type="NOA" address="0x00009888" value="0x47900C63" />
+        <register type="NOA" address="0x00009888" value="0x57900000" />
+        <register type="NOA" address="0x00009888" value="0x49900C63" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+        <register type="NOA" address="0x00009888" value="0x4B900063" />
+        <register type="NOA" address="0x00009888" value="0x59900000" />
+        <register type="NOA" address="0x00009888" value="0x43900003" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x0000272C" value="0xFFFFFFFF" />
+        <register type="OA" address="0x00002728" value="0xFFFFFFFF" />
+        <register type="OA" address="0x00002724" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x0000271C" value="0xFFFFFFFF" />
+        <register type="OA" address="0x00002718" value="0xFFFFFFFF" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x0000274C" value="0x86543210" />
+        <register type="OA" address="0x00002748" value="0x86543210" />
+        <register type="OA" address="0x00002744" value="0x00006667" />
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x0000275C" value="0x86543210" />
+        <register type="OA" address="0x00002758" value="0x86543210" />
+        <register type="OA" address="0x00002754" value="0x00006465" />
+        <register type="OA" address="0x00002750" value="0x00000000" />
+        <register type="OA" address="0x00002770" value="0x0007F81A" />
+        <register type="OA" address="0x00002774" value="0x0000FE00" />
+        <register type="OA" address="0x00002778" value="0x0007F82A" />
+        <register type="OA" address="0x0000277C" value="0x0000FE00" />
+        <register type="OA" address="0x00002780" value="0x0007F872" />
+        <register type="OA" address="0x00002784" value="0x0000FE00" />
+        <register type="OA" address="0x00002788" value="0x0007F8BA" />
+        <register type="OA" address="0x0000278C" value="0x0000FE00" />
+        <register type="OA" address="0x00002790" value="0x0007F87A" />
+        <register type="OA" address="0x00002794" value="0x0000FE00" />
+        <register type="OA" address="0x00002798" value="0x0007F8EA" />
+        <register type="OA" address="0x0000279C" value="0x0000FE00" />
+        <register type="OA" address="0x000027A0" value="0x0007F8E2" />
+        <register type="OA" address="0x000027A4" value="0x0000FE00" />
+        <register type="OA" address="0x000027A8" value="0x0007F8F2" />
+        <register type="OA" address="0x000027AC" value="0x0000FE00" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00015014" />
+        <register type="FLEX" address="0x0000E658" value="0x00025024" />
+        <register type="FLEX" address="0x0000E758" value="0x00035034" />
+        <register type="FLEX" address="0x0000E45C" value="0x00045044" />
+        <register type="FLEX" address="0x0000E55C" value="0x00055054" />
+        <register type="FLEX" address="0x0000E65C" value="0x00065064" />
+    </register_config>
+  </set>
+
+  <set name="Memory Writes Distribution Gen9"
+       mdapi_supported_apis="VK OGL OCL IO BB"
+       underscore_name="memory_writes"
+       hw_config_guid="e0d3da02-00bf-4a96-9795-b48158c73a68"
+       chipset="SKLGT2"
+       symbol_name="MemoryWrites"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GtiMemoryWrites"
+             description="The total number of GTI memory writes."
+             data_type="uint64"
+             equation="C 0 READ"
+             underscore_name="gti_memory_writes"
+             units="messages"
+             symbol_name="GtiMemoryWrites"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="GtiRingAccesses"
+             description="The total number of all GTI accesses to the ring."
+             data_type="uint64"
+             equation="C 3 READ 2 UMUL"
+             underscore_name="gti_ring_accesses"
+             units="messages"
+             symbol_name="GtiRingAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="GtiMscMemoryWrites"
+             description="The total number of GTI memory writes from Multisampling Color Cache (Multisampling Color Cache invalidations)."
+             data_type="uint64"
+             equation="B 4 READ"
+             underscore_name="gti_msc_memory_writes"
+             units="messages"
+             symbol_name="GtiMscMemoryWrites"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Color Cache"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="GtiCmdStreamerMemoryWrites"
+             description="The total number of GTI memory writes from Command Streamer."
+             data_type="uint64"
+             equation="B 0 READ"
+             underscore_name="gti_cmd_streamer_memory_writes"
+             units="messages"
+             symbol_name="GtiCmdStreamerMemoryWrites"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/3D Pipe/Command Streamer"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GtiL3Bank0Writes"
+             description="The total number of GTI memory writes from L3 Bank 0 (L3 Bank 0 invalidations)."
+             data_type="uint64"
+             equation="C 4 READ"
+             underscore_name="gti_l3_bank0_writes"
+             units="messages"
+             symbol_name="GtiL3Bank0Writes"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/L3"
+             />
+    <counter name="GtiL3Bank1Writes"
+             description="The total number of GTI memory writes from L3 Bank 1 (L3 Bank 1 invalidations)."
+             data_type="uint64"
+             equation="C 5 READ"
+             underscore_name="gti_l3_bank1_writes"
+             units="messages"
+             symbol_name="GtiL3Bank1Writes"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/L3"
+             />
+    <counter name="GtiL3Bank2Writes"
+             description="The total number of GTI memory writes from L3 Bank 2 (L3 Bank 2 invalidations)."
+             data_type="uint64"
+             equation="C 6 READ"
+             underscore_name="gti_l3_bank2_writes"
+             units="messages"
+             symbol_name="GtiL3Bank2Writes"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/L3"
+             />
+    <counter name="GtiL3Bank3Writes"
+             description="The total number of GTI memory writes from L3 Bank 3 (L3 Bank 3 invalidations)."
+             data_type="uint64"
+             equation="C 7 READ"
+             underscore_name="gti_l3_bank3_writes"
+             units="messages"
+             symbol_name="GtiL3Bank3Writes"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/L3"
+             />
+    <counter name="GtiL3Writes"
+             description="The total number of GTI memory writes from L3 (L3 invalidations)."
+             data_type="uint64"
+             equation="$GtiL3Bank0Writes $GtiL3Bank1Writes $GtiL3Bank2Writes $GtiL3Bank3Writes UADD UADD UADD"
+             underscore_name="gti_l3_writes"
+             units="messages"
+             symbol_name="GtiL3Writes"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/L3"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GtiRccMemoryWrites"
+             description="The total number of GTI memory writes from Render Color Cache (Render Color Cache invalidations)."
+             data_type="uint64"
+             equation="B 3 READ"
+             underscore_name="gti_rcc_memory_writes"
+             units="messages"
+             symbol_name="GtiRccMemoryWrites"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Color Cache"
+             />
+    <counter name="GtiSoMemoryWrites"
+             description="The total number of GTI memory writes from Stream Output."
+             data_type="uint64"
+             equation="B 2 READ"
+             underscore_name="gti_so_memory_writes"
+             units="messages"
+             symbol_name="GtiSoMemoryWrites"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/3D Pipe/Stream Output"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GtiStcMemoryWrites"
+             description="The total number of GTI memory writes from Stencil Cache."
+             data_type="uint64"
+             equation="B 6 READ"
+             underscore_name="gti_stc_memory_writes"
+             units="messages"
+             symbol_name="GtiStcMemoryWrites"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Depth Cache"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="GtiRczMemoryWrites"
+             description="The total number of GTI memory writes from Render Depth Cache."
+             data_type="uint64"
+             equation="B 7 READ"
+             underscore_name="gti_rcz_memory_writes"
+             units="messages"
+             symbol_name="GtiRczMemoryWrites"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Depth Cache"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="GtiHizMemoryWrites"
+             description="The total number of GTI memory writes from Hierarchical Depth Cache."
+             data_type="uint64"
+             equation="B 5 READ"
+             underscore_name="gti_hiz_memory_writes"
+             units="messages"
+             symbol_name="GtiHizMemoryWrites"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Depth Cache"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA"
+                     availability="$SliceMask 0x01 AND $SkuRevisionId 0x02 ULT &amp;&amp;"
+                     priority="0"
+                     >
+        <register type="NOA" address="0x00009840" value="0x000000A0" />
+        <register type="NOA" address="0x00009888" value="0x11810C00" />
+        <register type="NOA" address="0x00009888" value="0x1381001A" />
+        <register type="NOA" address="0x00009888" value="0x13945400" />
+        <register type="NOA" address="0x00009888" value="0x37906800" />
+        <register type="NOA" address="0x00009888" value="0x3F901400" />
+        <register type="NOA" address="0x00009888" value="0x03811300" />
+        <register type="NOA" address="0x00009888" value="0x05811B12" />
+        <register type="NOA" address="0x00009888" value="0x0781001A" />
+        <register type="NOA" address="0x00009888" value="0x1F810000" />
+        <register type="NOA" address="0x00009888" value="0x17810000" />
+        <register type="NOA" address="0x00009888" value="0x19810000" />
+        <register type="NOA" address="0x00009888" value="0x1B810000" />
+        <register type="NOA" address="0x00009888" value="0x1D810000" />
+        <register type="NOA" address="0x00009888" value="0x0F968000" />
+        <register type="NOA" address="0x00009888" value="0x1196C000" />
+        <register type="NOA" address="0x00009888" value="0x13964000" />
+        <register type="NOA" address="0x00009888" value="0x11938000" />
+        <register type="NOA" address="0x00009888" value="0x1B93FE00" />
+        <register type="NOA" address="0x00009888" value="0x01940010" />
+        <register type="NOA" address="0x00009888" value="0x07941100" />
+        <register type="NOA" address="0x00009888" value="0x09941312" />
+        <register type="NOA" address="0x00009888" value="0x0B941514" />
+        <register type="NOA" address="0x00009888" value="0x0D941716" />
+        <register type="NOA" address="0x00009888" value="0x11940000" />
+        <register type="NOA" address="0x00009888" value="0x19940000" />
+        <register type="NOA" address="0x00009888" value="0x1B940000" />
+        <register type="NOA" address="0x00009888" value="0x1D940000" />
+        <register type="NOA" address="0x00009888" value="0x1B954000" />
+        <register type="NOA" address="0x00009888" value="0x1D95A550" />
+        <register type="NOA" address="0x00009888" value="0x1F9502AA" />
+        <register type="NOA" address="0x00009888" value="0x2F900167" />
+        <register type="NOA" address="0x00009888" value="0x31900105" />
+        <register type="NOA" address="0x00009888" value="0x15900103" />
+        <register type="NOA" address="0x00009888" value="0x17900101" />
+        <register type="NOA" address="0x00009888" value="0x35900000" />
+        <register type="NOA" address="0x00009888" value="0x13908000" />
+        <register type="NOA" address="0x00009888" value="0x21908000" />
+        <register type="NOA" address="0x00009888" value="0x23908000" />
+        <register type="NOA" address="0x00009888" value="0x25908000" />
+        <register type="NOA" address="0x00009888" value="0x27908000" />
+        <register type="NOA" address="0x00009888" value="0x29908000" />
+        <register type="NOA" address="0x00009888" value="0x2B908000" />
+        <register type="NOA" address="0x00009888" value="0x2D908000" />
+        <register type="NOA" address="0x00009888" value="0x19908000" />
+        <register type="NOA" address="0x00009888" value="0x1B908000" />
+        <register type="NOA" address="0x00009888" value="0x1D908000" />
+        <register type="NOA" address="0x00009888" value="0x1F908000" />
+        <register type="NOA" address="0x00009888" value="0x11900000" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x41900C00" />
+        <register type="NOA" address="0x00009888" value="0x55900000" />
+        <register type="NOA" address="0x00009888" value="0x45900000" />
+        <register type="NOA" address="0x00009888" value="0x47900000" />
+        <register type="NOA" address="0x00009888" value="0x57900000" />
+        <register type="NOA" address="0x00009888" value="0x49900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+        <register type="NOA" address="0x00009888" value="0x4B900063" />
+        <register type="NOA" address="0x00009888" value="0x59900000" />
+        <register type="NOA" address="0x00009888" value="0x43900003" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x11810C00" />
+        <register type="NOA" address="0x00009888" value="0x1381001A" />
+        <register type="NOA" address="0x00009888" value="0x37906800" />
+        <register type="NOA" address="0x00009888" value="0x3F901000" />
+        <register type="NOA" address="0x00009888" value="0x03811300" />
+        <register type="NOA" address="0x00009888" value="0x05811B12" />
+        <register type="NOA" address="0x00009888" value="0x0781001A" />
+        <register type="NOA" address="0x00009888" value="0x1F810000" />
+        <register type="NOA" address="0x00009888" value="0x17810000" />
+        <register type="NOA" address="0x00009888" value="0x19810000" />
+        <register type="NOA" address="0x00009888" value="0x1B810000" />
+        <register type="NOA" address="0x00009888" value="0x1D810000" />
+        <register type="NOA" address="0x00009888" value="0x1B930055" />
+        <register type="NOA" address="0x00009888" value="0x03E58000" />
+        <register type="NOA" address="0x00009888" value="0x05E5C000" />
+        <register type="NOA" address="0x00009888" value="0x07E54000" />
+        <register type="NOA" address="0x00009888" value="0x13900160" />
+        <register type="NOA" address="0x00009888" value="0x21900161" />
+        <register type="NOA" address="0x00009888" value="0x23900162" />
+        <register type="NOA" address="0x00009888" value="0x25900163" />
+        <register type="NOA" address="0x00009888" value="0x27900164" />
+        <register type="NOA" address="0x00009888" value="0x29900165" />
+        <register type="NOA" address="0x00009888" value="0x2B900166" />
+        <register type="NOA" address="0x00009888" value="0x2D900167" />
+        <register type="NOA" address="0x00009888" value="0x2F900150" />
+        <register type="NOA" address="0x00009888" value="0x31900105" />
+        <register type="NOA" address="0x00009888" value="0x15900103" />
+        <register type="NOA" address="0x00009888" value="0x17900101" />
+        <register type="NOA" address="0x00009888" value="0x35900000" />
+        <register type="NOA" address="0x00009888" value="0x19908000" />
+        <register type="NOA" address="0x00009888" value="0x1B908000" />
+        <register type="NOA" address="0x00009888" value="0x1D908000" />
+        <register type="NOA" address="0x00009888" value="0x1F908000" />
+        <register type="NOA" address="0x00009888" value="0x11900000" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x41900C60" />
+        <register type="NOA" address="0x00009888" value="0x55900000" />
+        <register type="NOA" address="0x00009888" value="0x45900C00" />
+        <register type="NOA" address="0x00009888" value="0x47900C63" />
+        <register type="NOA" address="0x00009888" value="0x57900000" />
+        <register type="NOA" address="0x00009888" value="0x49900C63" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+        <register type="NOA" address="0x00009888" value="0x4B900063" />
+        <register type="NOA" address="0x00009888" value="0x59900000" />
+        <register type="NOA" address="0x00009888" value="0x43900003" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+    </register_config>
+    <register_config type="NOA"
+                     availability="$SkuRevisionId 0x05 ULT $SkuRevisionId 0x02 UGTE &amp;&amp;"
+                     priority="0"
+                     >
+        <register type="NOA" address="0x00009840" value="0x000000A0" />
+        <register type="NOA" address="0x00009888" value="0x11810C00" />
+        <register type="NOA" address="0x00009888" value="0x1381001A" />
+        <register type="NOA" address="0x00009888" value="0x13945400" />
+        <register type="NOA" address="0x00009888" value="0x37906800" />
+        <register type="NOA" address="0x00009888" value="0x3F901400" />
+        <register type="NOA" address="0x00009888" value="0x03811300" />
+        <register type="NOA" address="0x00009888" value="0x05811B12" />
+        <register type="NOA" address="0x00009888" value="0x0781001A" />
+        <register type="NOA" address="0x00009888" value="0x1F810000" />
+        <register type="NOA" address="0x00009888" value="0x17810000" />
+        <register type="NOA" address="0x00009888" value="0x19810000" />
+        <register type="NOA" address="0x00009888" value="0x1B810000" />
+        <register type="NOA" address="0x00009888" value="0x1D810000" />
+        <register type="NOA" address="0x00009888" value="0x19930800" />
+        <register type="NOA" address="0x00009888" value="0x1B93AA55" />
+        <register type="NOA" address="0x00009888" value="0x1D93002A" />
+        <register type="NOA" address="0x00009888" value="0x01940010" />
+        <register type="NOA" address="0x00009888" value="0x07941100" />
+        <register type="NOA" address="0x00009888" value="0x09941312" />
+        <register type="NOA" address="0x00009888" value="0x0B941514" />
+        <register type="NOA" address="0x00009888" value="0x0D941716" />
+        <register type="NOA" address="0x00009888" value="0x1B940000" />
+        <register type="NOA" address="0x00009888" value="0x11940000" />
+        <register type="NOA" address="0x00009888" value="0x01E58000" />
+        <register type="NOA" address="0x00009888" value="0x03E57000" />
+        <register type="NOA" address="0x00009888" value="0x2F900167" />
+        <register type="NOA" address="0x00009888" value="0x31900105" />
+        <register type="NOA" address="0x00009888" value="0x15900103" />
+        <register type="NOA" address="0x00009888" value="0x17900101" />
+        <register type="NOA" address="0x00009888" value="0x35900000" />
+        <register type="NOA" address="0x00009888" value="0x13908000" />
+        <register type="NOA" address="0x00009888" value="0x21908000" />
+        <register type="NOA" address="0x00009888" value="0x23908000" />
+        <register type="NOA" address="0x00009888" value="0x25908000" />
+        <register type="NOA" address="0x00009888" value="0x27908000" />
+        <register type="NOA" address="0x00009888" value="0x29908000" />
+        <register type="NOA" address="0x00009888" value="0x2B908000" />
+        <register type="NOA" address="0x00009888" value="0x2D908000" />
+        <register type="NOA" address="0x00009888" value="0x19908000" />
+        <register type="NOA" address="0x00009888" value="0x1B908000" />
+        <register type="NOA" address="0x00009888" value="0x1D908000" />
+        <register type="NOA" address="0x00009888" value="0x1F908000" />
+        <register type="NOA" address="0x00009888" value="0x11900000" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x41900C20" />
+        <register type="NOA" address="0x00009888" value="0x55900000" />
+        <register type="NOA" address="0x00009888" value="0x45900400" />
+        <register type="NOA" address="0x00009888" value="0x47900421" />
+        <register type="NOA" address="0x00009888" value="0x57900000" />
+        <register type="NOA" address="0x00009888" value="0x49900421" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+        <register type="NOA" address="0x00009888" value="0x4B900063" />
+        <register type="NOA" address="0x00009888" value="0x59900000" />
+        <register type="NOA" address="0x00009888" value="0x43900003" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x11810C00" />
+        <register type="NOA" address="0x00009888" value="0x1381001A" />
+        <register type="NOA" address="0x00009888" value="0x37906800" />
+        <register type="NOA" address="0x00009888" value="0x3F901000" />
+        <register type="NOA" address="0x00009888" value="0x03811300" />
+        <register type="NOA" address="0x00009888" value="0x05811B12" />
+        <register type="NOA" address="0x00009888" value="0x0781001A" />
+        <register type="NOA" address="0x00009888" value="0x1F810000" />
+        <register type="NOA" address="0x00009888" value="0x17810000" />
+        <register type="NOA" address="0x00009888" value="0x19810000" />
+        <register type="NOA" address="0x00009888" value="0x1B810000" />
+        <register type="NOA" address="0x00009888" value="0x1D810000" />
+        <register type="NOA" address="0x00009888" value="0x1B930055" />
+        <register type="NOA" address="0x00009888" value="0x03E58000" />
+        <register type="NOA" address="0x00009888" value="0x05E5C000" />
+        <register type="NOA" address="0x00009888" value="0x07E54000" />
+        <register type="NOA" address="0x00009888" value="0x13900160" />
+        <register type="NOA" address="0x00009888" value="0x21900161" />
+        <register type="NOA" address="0x00009888" value="0x23900162" />
+        <register type="NOA" address="0x00009888" value="0x25900163" />
+        <register type="NOA" address="0x00009888" value="0x27900164" />
+        <register type="NOA" address="0x00009888" value="0x29900165" />
+        <register type="NOA" address="0x00009888" value="0x2B900166" />
+        <register type="NOA" address="0x00009888" value="0x2D900167" />
+        <register type="NOA" address="0x00009888" value="0x2F900150" />
+        <register type="NOA" address="0x00009888" value="0x31900105" />
+        <register type="NOA" address="0x00009888" value="0x15900103" />
+        <register type="NOA" address="0x00009888" value="0x17900101" />
+        <register type="NOA" address="0x00009888" value="0x35900000" />
+        <register type="NOA" address="0x00009888" value="0x19908000" />
+        <register type="NOA" address="0x00009888" value="0x1B908000" />
+        <register type="NOA" address="0x00009888" value="0x1D908000" />
+        <register type="NOA" address="0x00009888" value="0x1F908000" />
+        <register type="NOA" address="0x00009888" value="0x11900000" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x41900C60" />
+        <register type="NOA" address="0x00009888" value="0x55900000" />
+        <register type="NOA" address="0x00009888" value="0x45900C00" />
+        <register type="NOA" address="0x00009888" value="0x47900C63" />
+        <register type="NOA" address="0x00009888" value="0x57900000" />
+        <register type="NOA" address="0x00009888" value="0x49900C63" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+        <register type="NOA" address="0x00009888" value="0x4B900063" />
+        <register type="NOA" address="0x00009888" value="0x59900000" />
+        <register type="NOA" address="0x00009888" value="0x43900003" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x0000272C" value="0xFFFFFFFF" />
+        <register type="OA" address="0x00002728" value="0xFFFFFFFF" />
+        <register type="OA" address="0x00002724" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x0000271C" value="0xFFFFFFFF" />
+        <register type="OA" address="0x00002718" value="0xFFFFFFFF" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x0000274C" value="0x86543210" />
+        <register type="OA" address="0x00002748" value="0x86543210" />
+        <register type="OA" address="0x00002744" value="0x00006667" />
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x0000275C" value="0x86543210" />
+        <register type="OA" address="0x00002758" value="0x86543210" />
+        <register type="OA" address="0x00002754" value="0x00006465" />
+        <register type="OA" address="0x00002750" value="0x00000000" />
+        <register type="OA" address="0x00002770" value="0x0007F81A" />
+        <register type="OA" address="0x00002774" value="0x0000FE00" />
+        <register type="OA" address="0x00002778" value="0x0007F82A" />
+        <register type="OA" address="0x0000277C" value="0x0000FE00" />
+        <register type="OA" address="0x00002780" value="0x0007F822" />
+        <register type="OA" address="0x00002784" value="0x0000FE00" />
+        <register type="OA" address="0x00002788" value="0x0007F8BA" />
+        <register type="OA" address="0x0000278C" value="0x0000FE00" />
+        <register type="OA" address="0x00002790" value="0x0007F87A" />
+        <register type="OA" address="0x00002794" value="0x0000FE00" />
+        <register type="OA" address="0x00002798" value="0x0007F8EA" />
+        <register type="OA" address="0x0000279C" value="0x0000FE00" />
+        <register type="OA" address="0x000027A0" value="0x0007F8E2" />
+        <register type="OA" address="0x000027A4" value="0x0000FE00" />
+        <register type="OA" address="0x000027A8" value="0x0007F8F2" />
+        <register type="OA" address="0x000027AC" value="0x0000FE00" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00015014" />
+        <register type="FLEX" address="0x0000E658" value="0x00025024" />
+        <register type="FLEX" address="0x0000E758" value="0x00035034" />
+        <register type="FLEX" address="0x0000E45C" value="0x00045044" />
+        <register type="FLEX" address="0x0000E55C" value="0x00055054" />
+        <register type="FLEX" address="0x0000E65C" value="0x00065064" />
+    </register_config>
+  </set>
+
+  <set name="Compute Metrics Extended Gen9"
+       mdapi_supported_apis="VK OGL4 OCL IO BB"
+       underscore_name="compute_extended"
+       hw_config_guid="c26b1fda-2752-4a33-a448-4c8718366846"
+       chipset="SKLGT2"
+       symbol_name="ComputeExtended"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="fpu0_active"
+             units="percent"
+             symbol_name="Fpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="fpu1_active"
+             units="percent"
+             symbol_name="Fpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU AVG IPC Rate"
+             description="The average rate of IPC calculated for 2 FPU pipelines."
+             data_type="float"
+             max_equation="2"
+             equation="A 9 READ  A 10 READ  A 11 READ UADD  A 9 READ USUB FDIV 1 FADD"
+             underscore_name="eu_avg_ipc_rate"
+             units="number"
+             symbol_name="EuAvgIpcRate"
+             semantic_type="ratio"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Typed Writes 0"
+             description="The subslice 0 typed writes."
+             data_type="uint64"
+             equation="C 0 READ"
+             underscore_name="typed_writes0"
+             units="messages"
+             symbol_name="TypedWrites0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="EuTypedAtomics0"
+             description="The subslice 0 EU Typed Atomics subslice 0."
+             data_type="uint64"
+             equation="B 5 READ"
+             underscore_name="eu_typed_atomics0"
+             units="messages"
+             symbol_name="EuTypedAtomics0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="Typed Atomics 0"
+             description="The subslice 0 typed atomics."
+             data_type="uint64"
+             equation="C 4 READ"
+             underscore_name="typed_atomics0"
+             units="messages"
+             symbol_name="TypedAtomics0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="TypedAtomicsPerCacheLine"
+             description="The ratio of EU typed atomics requests to L3 cache line writes."
+             data_type="float"
+             equation="$EuTypedAtomics0 $TypedAtomics0 FDIV"
+             underscore_name="typed_atomics_per_cache_line"
+             units="eu sends to l3 cache lines"
+             symbol_name="TypedAtomicsPerCacheLine"
+             semantic_type="ratio"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="EuUntypedReads0"
+             description="The subslice 0 EU Untyped Reads subslice 0."
+             data_type="uint64"
+             equation="B 0 READ"
+             underscore_name="eu_untyped_reads0"
+             units="messages"
+             symbol_name="EuUntypedReads0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="Untyped Writes 0"
+             description="The subslice 0 untyped writes (including SLM writes)."
+             data_type="uint64"
+             equation="C 1 READ"
+             underscore_name="untyped_writes0"
+             units="messages"
+             symbol_name="UntypedWrites0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="EuUntypedAtomics0"
+             description="The subslice 0 EU Untyped Atomics subslice 0."
+             data_type="uint64"
+             equation="B 4 READ"
+             underscore_name="eu_untyped_atomics0"
+             units="messages"
+             symbol_name="EuUntypedAtomics0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="EuUntypedWrites0"
+             description="The subslice 0 EU Untyped Writes subslice 0."
+             data_type="uint64"
+             equation="B 1 READ"
+             underscore_name="eu_untyped_writes0"
+             units="messages"
+             symbol_name="EuUntypedWrites0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="EuA64UntypedWrites0"
+             description="The subslice 0 EU A64 Untyped Writes subslice 0."
+             data_type="uint64"
+             equation="B 7 READ"
+             underscore_name="eu_a64_untyped_writes0"
+             units="messages"
+             symbol_name="EuA64UntypedWrites0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="UntypedWritesPerCacheLine"
+             description="The ratio of EU untyped write requests to L3 cache line writes."
+             data_type="float"
+             equation="$EuUntypedWrites0 $EuA64UntypedWrites0 UADD $UntypedWrites0 FDIV"
+             underscore_name="untyped_writes_per_cache_line"
+             units="eu sends to l3 cache lines"
+             symbol_name="UntypedWritesPerCacheLine"
+             semantic_type="ratio"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EuTypedWrites0"
+             description="The subslice 0 EU Typed Writes subslice 0."
+             data_type="uint64"
+             equation="B 3 READ"
+             underscore_name="eu_typed_writes0"
+             units="messages"
+             symbol_name="EuTypedWrites0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="TypedWritesPerCacheLine"
+             description="The ratio of EU typed write requests to L3 cache line writes."
+             data_type="float"
+             equation="$EuTypedWrites0 $TypedWrites0 FDIV"
+             underscore_name="typed_writes_per_cache_line"
+             units="eu sends to l3 cache lines"
+             symbol_name="TypedWritesPerCacheLine"
+             semantic_type="ratio"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="Typed Reads 0"
+             description="The subslice 0 typed reads."
+             data_type="uint64"
+             equation="C 2 READ"
+             underscore_name="typed_reads0"
+             units="messages"
+             symbol_name="TypedReads0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="Untyped Reads 0"
+             description="The subslice 0 untyped reads (including SLM reads)."
+             data_type="uint64"
+             equation="C 3 READ"
+             underscore_name="untyped_reads0"
+             units="messages"
+             symbol_name="UntypedReads0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="EuA64UntypedReads0"
+             description="The subslice 0 EU A64 Untyped Reads subslice 0."
+             data_type="uint64"
+             equation="B 6 READ"
+             underscore_name="eu_a64_untyped_reads0"
+             units="messages"
+             symbol_name="EuA64UntypedReads0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="EU Thread Occupancy"
+             description="The percentage of time in which hardware threads occupied EUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 13 READ 8 UMUL $EuCoresTotalCount UDIV $EuThreadsCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_thread_occupancy"
+             units="percent"
+             symbol_name="EuThreadOccupancy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EuTypedReads0"
+             description="The subslice 0 EU Typed Reads subslice 0."
+             data_type="uint64"
+             equation="B 2 READ"
+             underscore_name="eu_typed_reads0"
+             units="messages"
+             symbol_name="EuTypedReads0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="UntypedReadsPerCacheLine"
+             description="The ratio of EU untyped read requests to L3 cache line reads."
+             data_type="float"
+             equation="$EuUntypedReads0 $EuA64UntypedReads0 UADD $UntypedReads0 FDIV"
+             underscore_name="untyped_reads_per_cache_line"
+             units="eu sends to l3 cache lines"
+             symbol_name="UntypedReadsPerCacheLine"
+             semantic_type="ratio"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="TypedReadsPerCacheLine"
+             description="The ratio of EU typed read requests to L3 cache line reads."
+             data_type="float"
+             equation="$EuTypedReads0 $TypedReads0 FDIV"
+             underscore_name="typed_reads_per_cache_line"
+             units="eu sends to l3 cache lines"
+             symbol_name="TypedReadsPerCacheLine"
+             semantic_type="ratio"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <counter name="EU Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_send_active"
+             units="percent"
+             symbol_name="EuSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <register_config type="NOA"
+                     availability="$SubsliceMask 0x01 AND"
+                     priority="0"
+                     >
+        <register type="NOA" address="0x00009840" value="0x000000A0" />
+        <register type="NOA" address="0x00009888" value="0x106C00E0" />
+        <register type="NOA" address="0x00009888" value="0x141C8160" />
+        <register type="NOA" address="0x00009888" value="0x161C8015" />
+        <register type="NOA" address="0x00009888" value="0x181C0120" />
+        <register type="NOA" address="0x00009888" value="0x004E8000" />
+        <register type="NOA" address="0x00009888" value="0x0E4E8000" />
+        <register type="NOA" address="0x00009888" value="0x184E8000" />
+        <register type="NOA" address="0x00009888" value="0x1A4EAAA0" />
+        <register type="NOA" address="0x00009888" value="0x1C4E0002" />
+        <register type="NOA" address="0x00009888" value="0x024E8000" />
+        <register type="NOA" address="0x00009888" value="0x044E8000" />
+        <register type="NOA" address="0x00009888" value="0x064E8000" />
+        <register type="NOA" address="0x00009888" value="0x084E8000" />
+        <register type="NOA" address="0x00009888" value="0x0A4E8000" />
+        <register type="NOA" address="0x00009888" value="0x0E6C0B01" />
+        <register type="NOA" address="0x00009888" value="0x006C0200" />
+        <register type="NOA" address="0x00009888" value="0x026C000C" />
+        <register type="NOA" address="0x00009888" value="0x1C6C0000" />
+        <register type="NOA" address="0x00009888" value="0x1E6C0000" />
+        <register type="NOA" address="0x00009888" value="0x1A6C0000" />
+        <register type="NOA" address="0x00009888" value="0x0E1BC000" />
+        <register type="NOA" address="0x00009888" value="0x001B8000" />
+        <register type="NOA" address="0x00009888" value="0x021BC000" />
+        <register type="NOA" address="0x00009888" value="0x001C0041" />
+        <register type="NOA" address="0x00009888" value="0x061C4200" />
+        <register type="NOA" address="0x00009888" value="0x081C4443" />
+        <register type="NOA" address="0x00009888" value="0x0A1C4645" />
+        <register type="NOA" address="0x00009888" value="0x0C1C7647" />
+        <register type="NOA" address="0x00009888" value="0x041C7357" />
+        <register type="NOA" address="0x00009888" value="0x1C1C0030" />
+        <register type="NOA" address="0x00009888" value="0x101C0000" />
+        <register type="NOA" address="0x00009888" value="0x1A1C0000" />
+        <register type="NOA" address="0x00009888" value="0x121C8000" />
+        <register type="NOA" address="0x00009888" value="0x004C8000" />
+        <register type="NOA" address="0x00009888" value="0x0A4CAA2A" />
+        <register type="NOA" address="0x00009888" value="0x0C4C02AA" />
+        <register type="NOA" address="0x00009888" value="0x084CA000" />
+        <register type="NOA" address="0x00009888" value="0x000DA000" />
+        <register type="NOA" address="0x00009888" value="0x060D8000" />
+        <register type="NOA" address="0x00009888" value="0x080DA000" />
+        <register type="NOA" address="0x00009888" value="0x0A0DA000" />
+        <register type="NOA" address="0x00009888" value="0x0C0DA000" />
+        <register type="NOA" address="0x00009888" value="0x0E0DA000" />
+        <register type="NOA" address="0x00009888" value="0x020DA000" />
+        <register type="NOA" address="0x00009888" value="0x040DA000" />
+        <register type="NOA" address="0x00009888" value="0x0C0F5400" />
+        <register type="NOA" address="0x00009888" value="0x0E0F5515" />
+        <register type="NOA" address="0x00009888" value="0x100F0155" />
+        <register type="NOA" address="0x00009888" value="0x002C8000" />
+        <register type="NOA" address="0x00009888" value="0x0E2C8000" />
+        <register type="NOA" address="0x00009888" value="0x162CAA00" />
+        <register type="NOA" address="0x00009888" value="0x182C00AA" />
+        <register type="NOA" address="0x00009888" value="0x022C8000" />
+        <register type="NOA" address="0x00009888" value="0x042C8000" />
+        <register type="NOA" address="0x00009888" value="0x062C8000" />
+        <register type="NOA" address="0x00009888" value="0x082C8000" />
+        <register type="NOA" address="0x00009888" value="0x0A2C8000" />
+        <register type="NOA" address="0x00009888" value="0x11907FFF" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x41900040" />
+        <register type="NOA" address="0x00009888" value="0x55900000" />
+        <register type="NOA" address="0x00009888" value="0x45900802" />
+        <register type="NOA" address="0x00009888" value="0x47900842" />
+        <register type="NOA" address="0x00009888" value="0x57900000" />
+        <register type="NOA" address="0x00009888" value="0x49900842" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+        <register type="NOA" address="0x00009888" value="0x4B900000" />
+        <register type="NOA" address="0x00009888" value="0x59900000" />
+        <register type="NOA" address="0x00009888" value="0x43900800" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002724" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002770" value="0x0007FC2A" />
+        <register type="OA" address="0x00002774" value="0x0000BF00" />
+        <register type="OA" address="0x00002778" value="0x0007FC6A" />
+        <register type="OA" address="0x0000277C" value="0x0000BF00" />
+        <register type="OA" address="0x00002780" value="0x0007FC92" />
+        <register type="OA" address="0x00002784" value="0x0000BF00" />
+        <register type="OA" address="0x00002788" value="0x0007FCA2" />
+        <register type="OA" address="0x0000278C" value="0x0000BF00" />
+        <register type="OA" address="0x00002790" value="0x0007FC32" />
+        <register type="OA" address="0x00002794" value="0x0000BF00" />
+        <register type="OA" address="0x00002798" value="0x0007FC9A" />
+        <register type="OA" address="0x0000279C" value="0x0000BF00" />
+        <register type="OA" address="0x000027A0" value="0x0007FE6A" />
+        <register type="OA" address="0x000027A4" value="0x0000BF00" />
+        <register type="OA" address="0x000027A8" value="0x0007FE7A" />
+        <register type="OA" address="0x000027AC" value="0x0000BF00" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00000003" />
+        <register type="FLEX" address="0x0000E658" value="0x00002001" />
+        <register type="FLEX" address="0x0000E758" value="0x00778008" />
+        <register type="FLEX" address="0x0000E45C" value="0x00088078" />
+        <register type="FLEX" address="0x0000E55C" value="0x00808708" />
+        <register type="FLEX" address="0x0000E65C" value="0x00A08908" />
+    </register_config>
+  </set>
+
+  <set name="Compute Metrics L3 Cache Gen9"
+       mdapi_supported_apis="VK OGL4 OCL IO BB"
+       underscore_name="compute_l3_cache"
+       hw_config_guid="9fb22842-e708-43f7-9752-e0e41670c39e"
+       chipset="SKLGT2"
+       symbol_name="ComputeL3Cache"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Bank 03 Accesses"
+             description="The total number of accesses to L3 Bank 03."
+             data_type="uint64"
+             equation="B 3 READ 2 UMUL"
+             underscore_name="l3_bank03_accesses"
+             units="messages"
+             symbol_name="L3Bank03Accesses"
+             availability="$SliceMask 0x01 AND"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="slice"
+             mdapi_group="L3"
+             />
+    <counter name="L3 Accesses"
+             description="The total number of L3 accesses from all entities."
+             data_type="uint64"
+             equation="C 0 READ C 1 READ B 2 READ B 3 READ UADD UADD UADD 2 UMUL"
+             underscore_name="l3_accesses"
+             units="messages"
+             symbol_name="L3Accesses"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Sampler Throughput"
+             description="The total number of GPU memory bytes transferred between samplers and L3 caches."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="A 29 READ 64 UMUL"
+             underscore_name="l3_sampler_throughput"
+             units="bytes"
+             symbol_name="L3SamplerThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Sampler"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="fpu0_active"
+             units="percent"
+             symbol_name="Fpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="fpu1_active"
+             units="percent"
+             symbol_name="Fpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU AVG IPC Rate"
+             description="The average rate of IPC calculated for 2 FPU pipelines."
+             data_type="float"
+             max_equation="2"
+             equation="A 9 READ  A 10 READ  A 11 READ UADD  A 9 READ USUB FDIV 1 FADD"
+             underscore_name="eu_avg_ipc_rate"
+             units="number"
+             symbol_name="EuAvgIpcRate"
+             semantic_type="ratio"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier4 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU0 Binary Instruction"
+             description="The percentage of time in which execution units were actively processing binary instructions on FPU0."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_binary_fpu0_instruction"
+             units="percent"
+             symbol_name="EuBinaryFpu0Instruction"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes/Instructions"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="EU FPU0 Hybrid Instruction"
+             description="The percentage of time in which execution units were actively processing hybrid instructions on FPU0."
+             data_type="float"
+             max_equation="100"
+             equation="A 13 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_hybrid_fpu0_instruction"
+             units="percent"
+             symbol_name="EuHybridFpu0Instruction"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="EU Array/Pipes/Instructions"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Misses"
+             description="The total number of L3 misses."
+             data_type="uint64"
+             equation="C 4 READ C 5 READ UADD"
+             underscore_name="l3_misses"
+             units="messages"
+             symbol_name="L3Misses"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/TAG"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="L3 Bank 00 Accesses"
+             description="The total number of accesses to L3 Bank 00."
+             data_type="uint64"
+             equation="C 0 READ 2 UMUL"
+             underscore_name="l3_bank00_accesses"
+             units="messages"
+             symbol_name="L3Bank00Accesses"
+             availability="$SliceMask 0x01 AND"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="slice"
+             mdapi_group="L3"
+             />
+    <counter name="EU FPU0 Move Instruction"
+             description="The percentage of time in which execution units were actively processing move instructions on FPU0."
+             data_type="float"
+             max_equation="100"
+             equation="A 19 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_move_fpu0_instruction"
+             units="percent"
+             symbol_name="EuMoveFpu0Instruction"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes/Instructions"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU FPU1 Hybrid Instruction"
+             description="The percentage of time in which execution units were actively processing hybrid instructions on FPU1."
+             data_type="float"
+             max_equation="100"
+             equation="A 14 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_hybrid_fpu1_instruction"
+             units="percent"
+             symbol_name="EuHybridFpu1Instruction"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="EU Array/Pipes/Instructions"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GTI Read Throughput"
+             description="The total number of GPU memory bytes read from GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL"
+             equation="C 6 READ 64 UMUL"
+             underscore_name="gti_read_throughput"
+             units="bytes"
+             symbol_name="GtiReadThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GTI L3 Throughput"
+             description="The total number of GPU memory bytes transferred between L3 caches and GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="C 4 READ C 5 READ UADD 64 UMUL"
+             underscore_name="gti_l3_throughput"
+             units="bytes"
+             symbol_name="GtiL3Throughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Bank 00 IC Accesses"
+             description="The total number of accesses to L3 Bank 00 from IC cache."
+             data_type="uint64"
+             equation="B 0 READ B 1 READ UADD 2 UMUL $L3Bank00Accesses UMIN"
+             underscore_name="l3_bank00_ic_accesses"
+             units="messages"
+             symbol_name="L3Bank00IcAccesses"
+             availability="$SliceMask 0x01 AND"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="slice"
+             mdapi_group="L3/IC"
+             />
+    <counter name="L3 Bank 00 IC Hits"
+             description="The total number of hits in L3 Bank 00 from IC cache."
+             data_type="uint64"
+             equation="B 1 READ 2 UMUL $L3Bank00IcAccesses UMIN"
+             underscore_name="l3_bank00_ic_hits"
+             units="messages"
+             symbol_name="L3Bank00IcHits"
+             availability="$SliceMask 0x01 AND"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="slice"
+             mdapi_group="L3/IC"
+             />
+    <counter name="Sampler Accesses"
+             description="The total number of messages send to samplers."
+             data_type="uint64"
+             equation="A 28 READ"
+             underscore_name="sampler_accesses"
+             units="messages"
+             symbol_name="SamplerAccesses"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler"
+             />
+    <counter name="L3 Bank 01 Accesses"
+             description="The total number of accesses to L3 Bank 01."
+             data_type="uint64"
+             equation="C 1 READ 2 UMUL"
+             underscore_name="l3_bank01_accesses"
+             units="messages"
+             symbol_name="L3Bank01Accesses"
+             availability="$SliceMask 0x01 AND"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="slice"
+             mdapi_group="L3"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU0 Ternary Instruction"
+             description="The percentage of time in which execution units were actively processing ternary instructions on FPU0."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_ternary_fpu0_instruction"
+             units="percent"
+             symbol_name="EuTernaryFpu0Instruction"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes/Instructions"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU FPU1 Move Instruction"
+             description="The percentage of time in which execution units were actively processing move instructions on FPU1."
+             data_type="float"
+             max_equation="100"
+             equation="A 20 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_move_fpu1_instruction"
+             units="percent"
+             symbol_name="EuMoveFpu1Instruction"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes/Instructions"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="L3 Bank 02 Accesses"
+             description="The total number of accesses to L3 Bank 02."
+             data_type="uint64"
+             equation="B 2 READ 2 UMUL"
+             underscore_name="l3_bank02_accesses"
+             units="messages"
+             symbol_name="L3Bank02Accesses"
+             availability="$SliceMask 0x01 AND"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="slice"
+             mdapi_group="L3"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="L3 Total Throughput"
+             description="The total number of GPU memory bytes transferred via L3."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="$L3Accesses 64 UMUL"
+             underscore_name="l3_total_throughput"
+             units="bytes"
+             symbol_name="L3TotalThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GTI Write Throughput"
+             description="The total number of GPU memory bytes written to GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 32 UMUL"
+             equation="C 7 READ 64 UMUL"
+             underscore_name="gti_write_throughput"
+             units="bytes"
+             symbol_name="GtiWriteThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="EU FPU1 Binary Instruction"
+             description="The percentage of time in which execution units were actively processing binary instructions on FPU1."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_binary_fpu1_instruction"
+             units="percent"
+             symbol_name="EuBinaryFpu1Instruction"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes/Instructions"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU1 Ternary Instruction"
+             description="The percentage of time in which execution units were actively processing ternary instructions on FPU1."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_ternary_fpu1_instruction"
+             units="percent"
+             symbol_name="EuTernaryFpu1Instruction"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes/Instructions"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_send_active"
+             units="percent"
+             symbol_name="EuSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x000000A0" />
+        <register type="NOA" address="0x00009888" value="0x166C0760" />
+        <register type="NOA" address="0x00009888" value="0x1593001E" />
+        <register type="NOA" address="0x00009888" value="0x3F901403" />
+        <register type="NOA" address="0x00009888" value="0x004E8000" />
+        <register type="NOA" address="0x00009888" value="0x0E4E8000" />
+        <register type="NOA" address="0x00009888" value="0x184E8000" />
+        <register type="NOA" address="0x00009888" value="0x1A4E8020" />
+        <register type="NOA" address="0x00009888" value="0x1C4E0002" />
+        <register type="NOA" address="0x00009888" value="0x006C0051" />
+        <register type="NOA" address="0x00009888" value="0x066C5000" />
+        <register type="NOA" address="0x00009888" value="0x086C5C5D" />
+        <register type="NOA" address="0x00009888" value="0x0E6C5E5F" />
+        <register type="NOA" address="0x00009888" value="0x106C0000" />
+        <register type="NOA" address="0x00009888" value="0x186C0000" />
+        <register type="NOA" address="0x00009888" value="0x1C6C0000" />
+        <register type="NOA" address="0x00009888" value="0x1E6C0000" />
+        <register type="NOA" address="0x00009888" value="0x001B4000" />
+        <register type="NOA" address="0x00009888" value="0x061B8000" />
+        <register type="NOA" address="0x00009888" value="0x081BC000" />
+        <register type="NOA" address="0x00009888" value="0x0E1BC000" />
+        <register type="NOA" address="0x00009888" value="0x101C8000" />
+        <register type="NOA" address="0x00009888" value="0x1A1CE000" />
+        <register type="NOA" address="0x00009888" value="0x1C1C0030" />
+        <register type="NOA" address="0x00009888" value="0x004C8000" />
+        <register type="NOA" address="0x00009888" value="0x0A4C2A00" />
+        <register type="NOA" address="0x00009888" value="0x0C4C0280" />
+        <register type="NOA" address="0x00009888" value="0x000D2000" />
+        <register type="NOA" address="0x00009888" value="0x060D8000" />
+        <register type="NOA" address="0x00009888" value="0x080DA000" />
+        <register type="NOA" address="0x00009888" value="0x0E0DA000" />
+        <register type="NOA" address="0x00009888" value="0x0C0F0400" />
+        <register type="NOA" address="0x00009888" value="0x0E0F1500" />
+        <register type="NOA" address="0x00009888" value="0x100F0140" />
+        <register type="NOA" address="0x00009888" value="0x002C8000" />
+        <register type="NOA" address="0x00009888" value="0x0E2C8000" />
+        <register type="NOA" address="0x00009888" value="0x162C0A00" />
+        <register type="NOA" address="0x00009888" value="0x182C00A0" />
+        <register type="NOA" address="0x00009888" value="0x03933300" />
+        <register type="NOA" address="0x00009888" value="0x05930032" />
+        <register type="NOA" address="0x00009888" value="0x11930000" />
+        <register type="NOA" address="0x00009888" value="0x1B930000" />
+        <register type="NOA" address="0x00009888" value="0x1D900157" />
+        <register type="NOA" address="0x00009888" value="0x1F900167" />
+        <register type="NOA" address="0x00009888" value="0x35900000" />
+        <register type="NOA" address="0x00009888" value="0x19908000" />
+        <register type="NOA" address="0x00009888" value="0x1B908000" />
+        <register type="NOA" address="0x00009888" value="0x1190030F" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x41900000" />
+        <register type="NOA" address="0x00009888" value="0x55900000" />
+        <register type="NOA" address="0x00009888" value="0x45900042" />
+        <register type="NOA" address="0x00009888" value="0x47900000" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+        <register type="NOA" address="0x00009888" value="0x57900000" />
+        <register type="NOA" address="0x00009888" value="0x4B900000" />
+        <register type="NOA" address="0x00009888" value="0x59900000" />
+        <register type="NOA" address="0x00009888" value="0x53901111" />
+        <register type="NOA" address="0x00009888" value="0x43900420" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x30800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x30800000" />
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002770" value="0x0007FFFA" />
+        <register type="OA" address="0x00002774" value="0x0000FEFE" />
+        <register type="OA" address="0x00002778" value="0x0007FFFA" />
+        <register type="OA" address="0x0000277C" value="0x0000FEFD" />
+        <register type="OA" address="0x00002790" value="0x0007FFFA" />
+        <register type="OA" address="0x00002794" value="0x0000FBEF" />
+        <register type="OA" address="0x00002798" value="0x0007FFFA" />
+        <register type="OA" address="0x0000279C" value="0x0000FBDF" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00000003" />
+        <register type="FLEX" address="0x0000E658" value="0x00002001" />
+        <register type="FLEX" address="0x0000E758" value="0x00101100" />
+        <register type="FLEX" address="0x0000E45C" value="0x00201200" />
+        <register type="FLEX" address="0x0000E55C" value="0x00301300" />
+        <register type="FLEX" address="0x0000E65C" value="0x00401400" />
+    </register_config>
+  </set>
+
+  <set name="Metric set HDCAndSF"
+       mdapi_supported_apis="VK OGL OCL IO BB"
+       underscore_name="hdc_and_sf"
+       hw_config_guid="b4aa5e13-2d25-418f-827d-421f5cc4c43b"
+       chipset="SKLGT2"
+       symbol_name="HDCAndSF"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SQ is full"
+             description="The percentage of time when SQ is filled above a threshold (usually 48 entries)"
+             data_type="float"
+             max_equation="100"
+             equation="PERFCNT1 READ_REG 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gt_request_queue_full"
+             units="percent"
+             symbol_name="GTRequestQueueFull"
+             availability="true $QueryMode &&"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL4 OCL"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="Polygon Data Ready"
+             description="The percentage of time in which geometry pipeline output is ready"
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="poly_data_ready"
+             units="percent"
+             symbol_name="PolyDataReady"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/3D Pipe/Strip-Fans"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texel lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="HDC stalled by L3 (s0.ss1)"
+             description="Percentage of time when HDC has messages to L3, but it's stalled due to lack of credits (s0.ss1)"
+             data_type="float"
+             max_equation="100"
+             equation="C 5 READ C 4 READ USUB 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="non_sampler_shader01_access_stalled_on_l3"
+             units="percent"
+             symbol_name="NonSamplerShader01AccessStalledOnL3"
+             availability="$SubsliceMask 0x2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="GPU/Data Port"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="HDC stalled by L3 (s0.ss2)"
+             description="Percentage of time when HDC has messages to L3, but it's stalled due to lack of credits (s0.ss2)"
+             data_type="float"
+             max_equation="100"
+             equation="C 3 READ C 2 READ USUB 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="non_sampler_shader02_access_stalled_on_l3"
+             units="percent"
+             symbol_name="NonSamplerShader02AccessStalledOnL3"
+             availability="$SubsliceMask 0x4 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="GPU/Data Port"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="HDC stalled by L3 (s0.ss0)"
+             description="Percentage of time when HDC has messages to L3, but it's stalled due to lack of credits (s0.ss0)"
+             data_type="float"
+             max_equation="100"
+             equation="C 7 READ C 6 READ USUB 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="non_sampler_shader00_access_stalled_on_l3"
+             units="percent"
+             symbol_name="NonSamplerShader00AccessStalledOnL3"
+             availability="$SubsliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="GPU/Data Port"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x000000A0" />
+        <register type="NOA" address="0x00009888" value="0x104F0232" />
+        <register type="NOA" address="0x00009888" value="0x124F4640" />
+        <register type="NOA" address="0x00009888" value="0x106C0232" />
+        <register type="NOA" address="0x00009888" value="0x11834400" />
+        <register type="NOA" address="0x00009888" value="0x0A4E8000" />
+        <register type="NOA" address="0x00009888" value="0x0C4E8000" />
+        <register type="NOA" address="0x00009888" value="0x004F1880" />
+        <register type="NOA" address="0x00009888" value="0x024F08BB" />
+        <register type="NOA" address="0x00009888" value="0x044F001B" />
+        <register type="NOA" address="0x00009888" value="0x046C0100" />
+        <register type="NOA" address="0x00009888" value="0x066C000B" />
+        <register type="NOA" address="0x00009888" value="0x1A6C0000" />
+        <register type="NOA" address="0x00009888" value="0x041B8000" />
+        <register type="NOA" address="0x00009888" value="0x061B4000" />
+        <register type="NOA" address="0x00009888" value="0x1A1C1800" />
+        <register type="NOA" address="0x00009888" value="0x005B8000" />
+        <register type="NOA" address="0x00009888" value="0x025BC000" />
+        <register type="NOA" address="0x00009888" value="0x045B4000" />
+        <register type="NOA" address="0x00009888" value="0x125C8000" />
+        <register type="NOA" address="0x00009888" value="0x145C8000" />
+        <register type="NOA" address="0x00009888" value="0x165C8000" />
+        <register type="NOA" address="0x00009888" value="0x185C8000" />
+        <register type="NOA" address="0x00009888" value="0x0A4C00A0" />
+        <register type="NOA" address="0x00009888" value="0x000D8000" />
+        <register type="NOA" address="0x00009888" value="0x020DA000" />
+        <register type="NOA" address="0x00009888" value="0x040DA000" />
+        <register type="NOA" address="0x00009888" value="0x060D2000" />
+        <register type="NOA" address="0x00009888" value="0x0C0F5000" />
+        <register type="NOA" address="0x00009888" value="0x0E0F0055" />
+        <register type="NOA" address="0x00009888" value="0x022CC000" />
+        <register type="NOA" address="0x00009888" value="0x042CC000" />
+        <register type="NOA" address="0x00009888" value="0x062CC000" />
+        <register type="NOA" address="0x00009888" value="0x082CC000" />
+        <register type="NOA" address="0x00009888" value="0x0A2C8000" />
+        <register type="NOA" address="0x00009888" value="0x0C2C8000" />
+        <register type="NOA" address="0x00009888" value="0x0F828000" />
+        <register type="NOA" address="0x00009888" value="0x0F8305C0" />
+        <register type="NOA" address="0x00009888" value="0x09830000" />
+        <register type="NOA" address="0x00009888" value="0x07830000" />
+        <register type="NOA" address="0x00009888" value="0x1D950080" />
+        <register type="NOA" address="0x00009888" value="0x13928000" />
+        <register type="NOA" address="0x00009888" value="0x0F988000" />
+        <register type="NOA" address="0x00009888" value="0x31904000" />
+        <register type="NOA" address="0x00009888" value="0x1190FC00" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x59900000" />
+        <register type="NOA" address="0x00009888" value="0x4B9000A0" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x41900800" />
+        <register type="NOA" address="0x00009888" value="0x43900842" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+        <register type="NOA" address="0x00009888" value="0x45900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x000091BC" value="0xE0500000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002744" value="0x00800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x10800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+        <register type="OA" address="0x00002770" value="0x00000002" />
+        <register type="OA" address="0x00002774" value="0x0000FDFF" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E758" value="0x00015014" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+        <register type="FLEX" address="0x0000E65C" value="0x00055054" />
+    </register_config>
+  </set>
+
+  <set name="Metric set L3_1"
+       mdapi_supported_apis="VK OGL OCL IO BB"
+       underscore_name="l3_1"
+       hw_config_guid="504000e8-64f2-4aac-8301-51b81aa60d45"
+       chipset="SKLGT2"
+       symbol_name="L3_1"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 L3 Bank1 Active"
+             description="The percentage of time in which slice0 L3 bank1 is active"
+             data_type="float"
+             max_equation="100"
+             equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l30_bank1_active"
+             units="percent"
+             symbol_name="L30Bank1Active"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SQ is full"
+             description="The percentage of time when SQ is filled above a threshold (usually 48 entries)"
+             data_type="float"
+             max_equation="100"
+             equation="PERFCNT1 READ_REG 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gt_request_queue_full"
+             units="percent"
+             symbol_name="GTRequestQueueFull"
+             availability="true $QueryMode &&"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL4 OCL"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on the both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="Slice0 L3 Bank1 Stalled"
+             description="The percentage of time in which slice0 L3 bank1 is stalled"
+             data_type="float"
+             max_equation="100"
+             equation="B 4 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l30_bank1_stalled"
+             units="percent"
+             symbol_name="L30Bank1Stalled"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 L3 Bank0 Active"
+             description="The percentage of time in which slice0 L3 bank0 is active"
+             data_type="float"
+             max_equation="100"
+             equation="C 6 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l30_bank0_active"
+             units="percent"
+             symbol_name="L30Bank0Active"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 L3 Bank0 Stalled"
+             description="The percentage of time in which slice0 L3 bank0 is stalled"
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l30_bank0_stalled"
+             units="percent"
+             symbol_name="L30Bank0Stalled"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x000000A0" />
+        <register type="NOA" address="0x00009888" value="0x126C7B40" />
+        <register type="NOA" address="0x00009888" value="0x166C0020" />
+        <register type="NOA" address="0x00009888" value="0x0A603444" />
+        <register type="NOA" address="0x00009888" value="0x0A613400" />
+        <register type="NOA" address="0x00009888" value="0x1A4EA800" />
+        <register type="NOA" address="0x00009888" value="0x1C4E0002" />
+        <register type="NOA" address="0x00009888" value="0x024E8000" />
+        <register type="NOA" address="0x00009888" value="0x044E8000" />
+        <register type="NOA" address="0x00009888" value="0x064E8000" />
+        <register type="NOA" address="0x00009888" value="0x084E8000" />
+        <register type="NOA" address="0x00009888" value="0x0A4E8000" />
+        <register type="NOA" address="0x00009888" value="0x064F4000" />
+        <register type="NOA" address="0x00009888" value="0x0C6C5327" />
+        <register type="NOA" address="0x00009888" value="0x0E6C5425" />
+        <register type="NOA" address="0x00009888" value="0x006C2A00" />
+        <register type="NOA" address="0x00009888" value="0x026C285B" />
+        <register type="NOA" address="0x00009888" value="0x046C005C" />
+        <register type="NOA" address="0x00009888" value="0x106C0000" />
+        <register type="NOA" address="0x00009888" value="0x1C6C0000" />
+        <register type="NOA" address="0x00009888" value="0x1E6C0000" />
+        <register type="NOA" address="0x00009888" value="0x1A6C0800" />
+        <register type="NOA" address="0x00009888" value="0x0C1BC000" />
+        <register type="NOA" address="0x00009888" value="0x0E1BC000" />
+        <register type="NOA" address="0x00009888" value="0x001B8000" />
+        <register type="NOA" address="0x00009888" value="0x021BC000" />
+        <register type="NOA" address="0x00009888" value="0x041BC000" />
+        <register type="NOA" address="0x00009888" value="0x1C1C003C" />
+        <register type="NOA" address="0x00009888" value="0x121C8000" />
+        <register type="NOA" address="0x00009888" value="0x141C8000" />
+        <register type="NOA" address="0x00009888" value="0x161C8000" />
+        <register type="NOA" address="0x00009888" value="0x181C8000" />
+        <register type="NOA" address="0x00009888" value="0x1A1C0800" />
+        <register type="NOA" address="0x00009888" value="0x065B4000" />
+        <register type="NOA" address="0x00009888" value="0x1A5C1000" />
+        <register type="NOA" address="0x00009888" value="0x10600000" />
+        <register type="NOA" address="0x00009888" value="0x04600000" />
+        <register type="NOA" address="0x00009888" value="0x0C610044" />
+        <register type="NOA" address="0x00009888" value="0x10610000" />
+        <register type="NOA" address="0x00009888" value="0x06610000" />
+        <register type="NOA" address="0x00009888" value="0x0C4C02A8" />
+        <register type="NOA" address="0x00009888" value="0x084CA000" />
+        <register type="NOA" address="0x00009888" value="0x0A4C002A" />
+        <register type="NOA" address="0x00009888" value="0x0C0DA000" />
+        <register type="NOA" address="0x00009888" value="0x0E0DA000" />
+        <register type="NOA" address="0x00009888" value="0x000D8000" />
+        <register type="NOA" address="0x00009888" value="0x020DA000" />
+        <register type="NOA" address="0x00009888" value="0x040DA000" />
+        <register type="NOA" address="0x00009888" value="0x060D2000" />
+        <register type="NOA" address="0x00009888" value="0x100F0154" />
+        <register type="NOA" address="0x00009888" value="0x0C0F5000" />
+        <register type="NOA" address="0x00009888" value="0x0E0F0055" />
+        <register type="NOA" address="0x00009888" value="0x182C00AA" />
+        <register type="NOA" address="0x00009888" value="0x022C8000" />
+        <register type="NOA" address="0x00009888" value="0x042C8000" />
+        <register type="NOA" address="0x00009888" value="0x062C8000" />
+        <register type="NOA" address="0x00009888" value="0x082C8000" />
+        <register type="NOA" address="0x00009888" value="0x0A2C8000" />
+        <register type="NOA" address="0x00009888" value="0x0C2CC000" />
+        <register type="NOA" address="0x00009888" value="0x1190FFC0" />
+        <register type="NOA" address="0x00009888" value="0x57900000" />
+        <register type="NOA" address="0x00009888" value="0x49900420" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+        <register type="NOA" address="0x00009888" value="0x4B900021" />
+        <register type="NOA" address="0x00009888" value="0x59900000" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x41900400" />
+        <register type="NOA" address="0x00009888" value="0x43900421" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+        <register type="NOA" address="0x00009888" value="0x45900040" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x000091BC" value="0xE0500000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002744" value="0x00800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0xF0800000" />
+        <register type="OA" address="0x00002770" value="0x00100070" />
+        <register type="OA" address="0x00002774" value="0x0000FFF1" />
+        <register type="OA" address="0x00002778" value="0x00014002" />
+        <register type="OA" address="0x0000277C" value="0x0000C3FF" />
+        <register type="OA" address="0x00002780" value="0x00010002" />
+        <register type="OA" address="0x00002784" value="0x0000C7FF" />
+        <register type="OA" address="0x00002788" value="0x00004002" />
+        <register type="OA" address="0x0000278C" value="0x0000D3FF" />
+        <register type="OA" address="0x00002790" value="0x00100700" />
+        <register type="OA" address="0x00002794" value="0x0000FF1F" />
+        <register type="OA" address="0x00002798" value="0x00001402" />
+        <register type="OA" address="0x0000279C" value="0x0000FC3F" />
+        <register type="OA" address="0x000027A0" value="0x00001002" />
+        <register type="OA" address="0x000027A4" value="0x0000FC7F" />
+        <register type="OA" address="0x000027A8" value="0x00000402" />
+        <register type="OA" address="0x000027AC" value="0x0000FD3F" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E758" value="0x00015014" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+        <register type="FLEX" address="0x0000E65C" value="0x00055054" />
+    </register_config>
+  </set>
+
+  <set name="Metric set L3_2"
+       mdapi_supported_apis="VK OGL OCL IO BB"
+       underscore_name="l3_2"
+       hw_config_guid="f542479b-6685-4670-ad8e-9fe282a2eb5b"
+       chipset="SKLGT2"
+       symbol_name="L3_2"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SQ is full"
+             description="The percentage of time when SQ is filled above a threshold (usually 48 entries)"
+             data_type="float"
+             max_equation="100"
+             equation="PERFCNT1 READ_REG 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gt_request_queue_full"
+             units="percent"
+             symbol_name="GTRequestQueueFull"
+             availability="true $QueryMode &&"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL4 OCL"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on the both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 L3 Bank2 Stalled"
+             description="The percentage of time in which slice0 L3 bank2 is stalled"
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l30_bank2_stalled"
+             units="percent"
+             symbol_name="L30Bank2Stalled"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 L3 Bank2 Active"
+             description="The percentage of time in which slice0 L3 bank2 is active"
+             data_type="float"
+             max_equation="100"
+             equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l30_bank2_active"
+             units="percent"
+             symbol_name="L30Bank2Active"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x000000A0" />
+        <register type="NOA" address="0x00009888" value="0x126C02E0" />
+        <register type="NOA" address="0x00009888" value="0x146C0001" />
+        <register type="NOA" address="0x00009888" value="0x0A623400" />
+        <register type="NOA" address="0x00009888" value="0x044E8000" />
+        <register type="NOA" address="0x00009888" value="0x064E8000" />
+        <register type="NOA" address="0x00009888" value="0x084E8000" />
+        <register type="NOA" address="0x00009888" value="0x0A4E8000" />
+        <register type="NOA" address="0x00009888" value="0x064F4000" />
+        <register type="NOA" address="0x00009888" value="0x026C3324" />
+        <register type="NOA" address="0x00009888" value="0x046C3422" />
+        <register type="NOA" address="0x00009888" value="0x106C0000" />
+        <register type="NOA" address="0x00009888" value="0x1A6C0000" />
+        <register type="NOA" address="0x00009888" value="0x021BC000" />
+        <register type="NOA" address="0x00009888" value="0x041BC000" />
+        <register type="NOA" address="0x00009888" value="0x141C8000" />
+        <register type="NOA" address="0x00009888" value="0x161C8000" />
+        <register type="NOA" address="0x00009888" value="0x181C8000" />
+        <register type="NOA" address="0x00009888" value="0x1A1C0800" />
+        <register type="NOA" address="0x00009888" value="0x065B4000" />
+        <register type="NOA" address="0x00009888" value="0x1A5C1000" />
+        <register type="NOA" address="0x00009888" value="0x06614000" />
+        <register type="NOA" address="0x00009888" value="0x0C620044" />
+        <register type="NOA" address="0x00009888" value="0x10620000" />
+        <register type="NOA" address="0x00009888" value="0x06620000" />
+        <register type="NOA" address="0x00009888" value="0x084C8000" />
+        <register type="NOA" address="0x00009888" value="0x0A4C002A" />
+        <register type="NOA" address="0x00009888" value="0x020DA000" />
+        <register type="NOA" address="0x00009888" value="0x040DA000" />
+        <register type="NOA" address="0x00009888" value="0x060D2000" />
+        <register type="NOA" address="0x00009888" value="0x0C0F4000" />
+        <register type="NOA" address="0x00009888" value="0x0E0F0055" />
+        <register type="NOA" address="0x00009888" value="0x042C8000" />
+        <register type="NOA" address="0x00009888" value="0x062C8000" />
+        <register type="NOA" address="0x00009888" value="0x082C8000" />
+        <register type="NOA" address="0x00009888" value="0x0A2C8000" />
+        <register type="NOA" address="0x00009888" value="0x0C2CC000" />
+        <register type="NOA" address="0x00009888" value="0x1190F800" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x43900000" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+        <register type="NOA" address="0x00009888" value="0x45900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x000091BC" value="0xE0500000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002744" value="0x00800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+        <register type="OA" address="0x00002770" value="0x00100070" />
+        <register type="OA" address="0x00002774" value="0x0000FFF1" />
+        <register type="OA" address="0x00002778" value="0x00028002" />
+        <register type="OA" address="0x0000277C" value="0x000087FF" />
+        <register type="OA" address="0x00002780" value="0x00020002" />
+        <register type="OA" address="0x00002784" value="0x00008FFF" />
+        <register type="OA" address="0x00002788" value="0x00008002" />
+        <register type="OA" address="0x0000278C" value="0x0000A7FF" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E758" value="0x00015014" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+        <register type="FLEX" address="0x0000E65C" value="0x00055054" />
+    </register_config>
+  </set>
+
+  <set name="Metric set L3_3"
+       mdapi_supported_apis="VK OGL OCL IO BB"
+       underscore_name="l3_3"
+       hw_config_guid="1cbf1e9f-c2de-4cc2-8d1c-2c33c25a2332"
+       chipset="SKLGT2"
+       symbol_name="L3_3"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SQ is full"
+             description="The percentage of time when SQ is filled above a threshold (usually 48 entries)."
+             data_type="float"
+             max_equation="100"
+             equation="PERFCNT1 READ_REG 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gt_request_queue_full"
+             units="percent"
+             symbol_name="GTRequestQueueFull"
+             availability="true $QueryMode &&"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL4 OCL"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were actively processed on both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Slice0 L3 Bank3 Stalled"
+             description="The percentage of time in which slice0 L3 bank3 is stalled."
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l30_bank3_stalled"
+             units="percent"
+             symbol_name="L30Bank3Stalled"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texel lookups (with 2x2 accuracy) that missed the L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 L3 Bank3 Active"
+             description="The percentage of time in which slice0 L3 bank3 is active."
+             data_type="float"
+             max_equation="100"
+             equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l30_bank3_active"
+             units="percent"
+             symbol_name="L30Bank3Active"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x000000A0" />
+        <register type="NOA" address="0x00009888" value="0x126C4E80" />
+        <register type="NOA" address="0x00009888" value="0x146C0000" />
+        <register type="NOA" address="0x00009888" value="0x0A633400" />
+        <register type="NOA" address="0x00009888" value="0x044E8000" />
+        <register type="NOA" address="0x00009888" value="0x064E8000" />
+        <register type="NOA" address="0x00009888" value="0x084E8000" />
+        <register type="NOA" address="0x00009888" value="0x0A4E8000" />
+        <register type="NOA" address="0x00009888" value="0x0C4E8000" />
+        <register type="NOA" address="0x00009888" value="0x026C3321" />
+        <register type="NOA" address="0x00009888" value="0x046C342F" />
+        <register type="NOA" address="0x00009888" value="0x106C0000" />
+        <register type="NOA" address="0x00009888" value="0x1A6C2000" />
+        <register type="NOA" address="0x00009888" value="0x021BC000" />
+        <register type="NOA" address="0x00009888" value="0x041BC000" />
+        <register type="NOA" address="0x00009888" value="0x061B4000" />
+        <register type="NOA" address="0x00009888" value="0x141C8000" />
+        <register type="NOA" address="0x00009888" value="0x161C8000" />
+        <register type="NOA" address="0x00009888" value="0x181C8000" />
+        <register type="NOA" address="0x00009888" value="0x1A1C1800" />
+        <register type="NOA" address="0x00009888" value="0x06604000" />
+        <register type="NOA" address="0x00009888" value="0x0C630044" />
+        <register type="NOA" address="0x00009888" value="0x10630000" />
+        <register type="NOA" address="0x00009888" value="0x06630000" />
+        <register type="NOA" address="0x00009888" value="0x084C8000" />
+        <register type="NOA" address="0x00009888" value="0x0A4C00AA" />
+        <register type="NOA" address="0x00009888" value="0x020DA000" />
+        <register type="NOA" address="0x00009888" value="0x040DA000" />
+        <register type="NOA" address="0x00009888" value="0x060D2000" />
+        <register type="NOA" address="0x00009888" value="0x0C0F4000" />
+        <register type="NOA" address="0x00009888" value="0x0E0F0055" />
+        <register type="NOA" address="0x00009888" value="0x042C8000" />
+        <register type="NOA" address="0x00009888" value="0x062C8000" />
+        <register type="NOA" address="0x00009888" value="0x082C8000" />
+        <register type="NOA" address="0x00009888" value="0x0A2C8000" />
+        <register type="NOA" address="0x00009888" value="0x0C2C8000" />
+        <register type="NOA" address="0x00009888" value="0x1190F800" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x43900842" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+        <register type="NOA" address="0x00009888" value="0x45900002" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x000091BC" value="0xE0500000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002744" value="0x00800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+        <register type="OA" address="0x00002770" value="0x00100070" />
+        <register type="OA" address="0x00002774" value="0x0000FFF1" />
+        <register type="OA" address="0x00002778" value="0x00028002" />
+        <register type="OA" address="0x0000277C" value="0x000087FF" />
+        <register type="OA" address="0x00002780" value="0x00020002" />
+        <register type="OA" address="0x00002784" value="0x00008FFF" />
+        <register type="OA" address="0x00002788" value="0x00008002" />
+        <register type="OA" address="0x0000278C" value="0x0000A7FF" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E758" value="0x00015014" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+        <register type="FLEX" address="0x0000E65C" value="0x00055054" />
+    </register_config>
+  </set>
+
+  <set name="Metric set RasterizerAndPixelBackend"
+       mdapi_supported_apis="VK OGL OCL IO BB"
+       underscore_name="rasterizer_and_pixel_backend"
+       hw_config_guid="b4e54cc8-a3a0-4ccd-9990-65d3184e5a38"
+       chipset="SKLGT2"
+       symbol_name="RasterizerAndPixelBackend"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SQ is full"
+             description="The percentage of time when SQ is filled above a threshold (usually 48 entries)"
+             data_type="float"
+             max_equation="100"
+             equation="PERFCNT1 READ_REG 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gt_request_queue_full"
+             units="percent"
+             symbol_name="GTRequestQueueFull"
+             availability="true $QueryMode &&"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL4 OCL"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on the both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Slice0 Pixel Values Ready"
+             description="The percentage of time in which slice0 pixel values are ready"
+             data_type="float"
+             max_equation="100"
+             equation="C 6 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="pixel_values0_ready"
+             units="percent"
+             symbol_name="PixelValues0Ready"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/3D Pipe"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="Slice0 Rasterizer Input Available"
+             description="The percentage of time in which slice0 rasterizer input is available"
+             data_type="float"
+             max_equation="100"
+             equation="B 1 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="rasterizer0_input_available"
+             units="percent"
+             symbol_name="Rasterizer0InputAvailable"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Rasterizer"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Slice0 Post-EarlyZ Pixel Data Ready"
+             description="The percentage of time in which slice0 post-EarlyZ pixel data is ready (after early Z tests have been applied)"
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="pixel_data0_ready"
+             units="percent"
+             symbol_name="PixelData0Ready"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Rasterizer/Early Depth Test"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 Rasterizer Output Ready"
+             description="The percentage of time in which slice0 rasterizer output is ready"
+             data_type="float"
+             max_equation="100"
+             equation="C 5 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="rasterizer0_output_ready"
+             units="percent"
+             symbol_name="Rasterizer0OutputReady"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Rasterizer"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="Slice0 PS Output Available"
+             description="The percentage of time in which slice0 PS output is available"
+             data_type="float"
+             max_equation="100"
+             equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_output0_available"
+             units="percent"
+             symbol_name="PSOutput0Available"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/3D Pipe"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x000000A0" />
+        <register type="NOA" address="0x00009888" value="0x102F3800" />
+        <register type="NOA" address="0x00009888" value="0x144D0500" />
+        <register type="NOA" address="0x00009888" value="0x120D03C0" />
+        <register type="NOA" address="0x00009888" value="0x140D03CF" />
+        <register type="NOA" address="0x00009888" value="0x0C0F0004" />
+        <register type="NOA" address="0x00009888" value="0x0C4E4000" />
+        <register type="NOA" address="0x00009888" value="0x042F0480" />
+        <register type="NOA" address="0x00009888" value="0x082F0000" />
+        <register type="NOA" address="0x00009888" value="0x022F0000" />
+        <register type="NOA" address="0x00009888" value="0x0A4C0090" />
+        <register type="NOA" address="0x00009888" value="0x064D0027" />
+        <register type="NOA" address="0x00009888" value="0x004D0000" />
+        <register type="NOA" address="0x00009888" value="0x000D0D40" />
+        <register type="NOA" address="0x00009888" value="0x020D803F" />
+        <register type="NOA" address="0x00009888" value="0x040D8023" />
+        <register type="NOA" address="0x00009888" value="0x100D0000" />
+        <register type="NOA" address="0x00009888" value="0x060D2000" />
+        <register type="NOA" address="0x00009888" value="0x020F0010" />
+        <register type="NOA" address="0x00009888" value="0x000F0000" />
+        <register type="NOA" address="0x00009888" value="0x0E0F0050" />
+        <register type="NOA" address="0x00009888" value="0x0A2C8000" />
+        <register type="NOA" address="0x00009888" value="0x0C2C8000" />
+        <register type="NOA" address="0x00009888" value="0x1190FC00" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x41901400" />
+        <register type="NOA" address="0x00009888" value="0x43901485" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+        <register type="NOA" address="0x00009888" value="0x45900001" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x000091BC" value="0xE0500000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002744" value="0x00800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x30800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+        <register type="OA" address="0x00002770" value="0x00000002" />
+        <register type="OA" address="0x00002774" value="0x0000EFFF" />
+        <register type="OA" address="0x00002778" value="0x00006000" />
+        <register type="OA" address="0x0000277C" value="0x0000F3FF" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E758" value="0x00015014" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+        <register type="FLEX" address="0x0000E65C" value="0x00055054" />
+    </register_config>
+  </set>
+
+  <set name="Metric set Sampler"
+       mdapi_supported_apis="VK OGL OCL IO BB"
+       underscore_name="sampler"
+       hw_config_guid="efe7eba4-fd9e-4a09-a92b-334970b5de57"
+       chipset="SKLGT2"
+       symbol_name="Sampler"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 Subslice2 Input Available"
+             description="The percentage of time in which slice0 subslice2 sampler input is available"
+             data_type="float"
+             max_equation="100"
+             equation="B 1 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler02_input_available"
+             units="percent"
+             symbol_name="Sampler02InputAvailable"
+             availability="$SubsliceMask 0x4 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SQ is full"
+             description="The percentage of time when SQ is filled above a threshold (usually 48 entries)"
+             data_type="float"
+             max_equation="100"
+             equation="PERFCNT1 READ_REG 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gt_request_queue_full"
+             units="percent"
+             symbol_name="GTRequestQueueFull"
+             availability="true $QueryMode &&"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL4 OCL"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 Subslice0 Input Available"
+             description="The percentage of time in which slice0 subslice0 sampler input is available"
+             data_type="float"
+             max_equation="100"
+             equation="B 2 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler00_input_available"
+             units="percent"
+             symbol_name="Sampler00InputAvailable"
+             availability="$SubsliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on the both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="Slice0 Subslice2 Sampler Output Ready"
+             description="The percentage of time in which slice0 subslice2 sampler output is ready"
+             data_type="float"
+             max_equation="100"
+             equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler02_output_ready"
+             units="percent"
+             symbol_name="Sampler02OutputReady"
+             availability="$SubsliceMask 0x4 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Slice0 Subslice1 Input Available"
+             description="The percentage of time in which slice0 subslice1 sampler input is available"
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler01_input_available"
+             units="percent"
+             symbol_name="Sampler01InputAvailable"
+             availability="$SubsliceMask 0x2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Slice0 Subslice0 Sampler Output Ready"
+             description="The percentage of time in which slice0 subslice0 sampler output is ready"
+             data_type="float"
+             max_equation="100"
+             equation="C 6 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler00_output_ready"
+             units="percent"
+             symbol_name="Sampler00OutputReady"
+             availability="$SubsliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Slice0 Subslice1 Sampler Output Ready"
+             description="The percentage of time in which slice0 subslice1 sampler output is ready"
+             data_type="float"
+             max_equation="100"
+             equation="C 5 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler01_output_ready"
+             units="percent"
+             symbol_name="Sampler01OutputReady"
+             availability="$SubsliceMask 0x2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x000000A0" />
+        <register type="NOA" address="0x00009888" value="0x14152C00" />
+        <register type="NOA" address="0x00009888" value="0x16150005" />
+        <register type="NOA" address="0x00009888" value="0x121600A0" />
+        <register type="NOA" address="0x00009888" value="0x14352C00" />
+        <register type="NOA" address="0x00009888" value="0x16350005" />
+        <register type="NOA" address="0x00009888" value="0x123600A0" />
+        <register type="NOA" address="0x00009888" value="0x14552C00" />
+        <register type="NOA" address="0x00009888" value="0x16550005" />
+        <register type="NOA" address="0x00009888" value="0x125600A0" />
+        <register type="NOA" address="0x00009888" value="0x062F6000" />
+        <register type="NOA" address="0x00009888" value="0x022F2000" />
+        <register type="NOA" address="0x00009888" value="0x0C4C0050" />
+        <register type="NOA" address="0x00009888" value="0x0A4C0010" />
+        <register type="NOA" address="0x00009888" value="0x0C0D8000" />
+        <register type="NOA" address="0x00009888" value="0x0E0DA000" />
+        <register type="NOA" address="0x00009888" value="0x000D8000" />
+        <register type="NOA" address="0x00009888" value="0x020DA000" />
+        <register type="NOA" address="0x00009888" value="0x040DA000" />
+        <register type="NOA" address="0x00009888" value="0x060D2000" />
+        <register type="NOA" address="0x00009888" value="0x100F0350" />
+        <register type="NOA" address="0x00009888" value="0x0C0FB000" />
+        <register type="NOA" address="0x00009888" value="0x0E0F00DA" />
+        <register type="NOA" address="0x00009888" value="0x182C0028" />
+        <register type="NOA" address="0x00009888" value="0x0A2C8000" />
+        <register type="NOA" address="0x00009888" value="0x022DC000" />
+        <register type="NOA" address="0x00009888" value="0x042D4000" />
+        <register type="NOA" address="0x00009888" value="0x0C138000" />
+        <register type="NOA" address="0x00009888" value="0x0E132000" />
+        <register type="NOA" address="0x00009888" value="0x0413C000" />
+        <register type="NOA" address="0x00009888" value="0x1C140018" />
+        <register type="NOA" address="0x00009888" value="0x0C157000" />
+        <register type="NOA" address="0x00009888" value="0x0E150078" />
+        <register type="NOA" address="0x00009888" value="0x10150000" />
+        <register type="NOA" address="0x00009888" value="0x04162180" />
+        <register type="NOA" address="0x00009888" value="0x02160000" />
+        <register type="NOA" address="0x00009888" value="0x04174000" />
+        <register type="NOA" address="0x00009888" value="0x0233A000" />
+        <register type="NOA" address="0x00009888" value="0x04333000" />
+        <register type="NOA" address="0x00009888" value="0x14348000" />
+        <register type="NOA" address="0x00009888" value="0x16348000" />
+        <register type="NOA" address="0x00009888" value="0x02357870" />
+        <register type="NOA" address="0x00009888" value="0x10350000" />
+        <register type="NOA" address="0x00009888" value="0x04360043" />
+        <register type="NOA" address="0x00009888" value="0x02360000" />
+        <register type="NOA" address="0x00009888" value="0x04371000" />
+        <register type="NOA" address="0x00009888" value="0x0E538000" />
+        <register type="NOA" address="0x00009888" value="0x00538000" />
+        <register type="NOA" address="0x00009888" value="0x06533000" />
+        <register type="NOA" address="0x00009888" value="0x1C540020" />
+        <register type="NOA" address="0x00009888" value="0x12548000" />
+        <register type="NOA" address="0x00009888" value="0x0E557000" />
+        <register type="NOA" address="0x00009888" value="0x00557800" />
+        <register type="NOA" address="0x00009888" value="0x10550000" />
+        <register type="NOA" address="0x00009888" value="0x06560043" />
+        <register type="NOA" address="0x00009888" value="0x02560000" />
+        <register type="NOA" address="0x00009888" value="0x06571000" />
+        <register type="NOA" address="0x00009888" value="0x1190FF80" />
+        <register type="NOA" address="0x00009888" value="0x57900000" />
+        <register type="NOA" address="0x00009888" value="0x49900000" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+        <register type="NOA" address="0x00009888" value="0x4B900060" />
+        <register type="NOA" address="0x00009888" value="0x59900000" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x41900C00" />
+        <register type="NOA" address="0x00009888" value="0x43900842" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+        <register type="NOA" address="0x00009888" value="0x45900060" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x000091BC" value="0xE0500000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002744" value="0x00800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x70800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+        <register type="OA" address="0x00002770" value="0x0000C000" />
+        <register type="OA" address="0x00002774" value="0x0000E7FF" />
+        <register type="OA" address="0x00002778" value="0x00003000" />
+        <register type="OA" address="0x0000277C" value="0x0000F9FF" />
+        <register type="OA" address="0x00002780" value="0x00000C00" />
+        <register type="OA" address="0x00002784" value="0x0000FE7F" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E758" value="0x00015014" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+        <register type="FLEX" address="0x0000E65C" value="0x00055054" />
+    </register_config>
+  </set>
+
+  <set name="Metric set TDL_1"
+       mdapi_supported_apis="VK OGL OCL IO BB"
+       underscore_name="tdl_1"
+       hw_config_guid="e9bd0bbb-c7b7-4a26-a27a-246987354776"
+       chipset="SKLGT2"
+       symbol_name="TDL_1"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SQ is full"
+             description="The percentage of time when SQ is filled above a threshold (usually 48 entries)"
+             data_type="float"
+             max_equation="100"
+             equation="PERFCNT1 READ_REG 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gt_request_queue_full"
+             units="percent"
+             symbol_name="GTRequestQueueFull"
+             availability="true $QueryMode &&"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL4 OCL"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on the both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="NonPS Thread Ready For Dispatch on Slice0 Subslice2"
+             description="The percentage of time in which non-PS thread is ready for dispatch on slice0 subslice2 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="B 4 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="non_ps_thread02_ready_for_dispatch"
+             units="percent"
+             symbol_name="NonPSThread02ReadyForDispatch"
+             availability="$SubsliceMask 0x4 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="NonPS Thread Ready For Dispatch on Slice0 Subslice0"
+             description="The percentage of time in which non-PS thread is ready for dispatch on slice0 subslice0 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="B 2 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="non_ps_thread00_ready_for_dispatch"
+             units="percent"
+             symbol_name="NonPSThread00ReadyForDispatch"
+             availability="$SubsliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Thread Ready For Dispatch on Slice0 Subslice0"
+             description="The percentage of time in which PS thread is ready for dispatch on slice0 subslice0 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="B 1 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_thread00_ready_for_dispatch"
+             units="percent"
+             symbol_name="PSThread00ReadyForDispatch"
+             availability="$SubsliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="PS Thread Ready For Dispatch on Slice0 Subslice1"
+             description="The percentage of time in which PS thread is ready for dispatch on slice0 subslice1 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="B 5 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_thread01_ready_for_dispatch"
+             units="percent"
+             symbol_name="PSThread01ReadyForDispatch"
+             availability="$SubsliceMask 0x2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="PS Thread Ready For Dispatch on Slice0 Subslice2"
+             description="The percentage of time in which PS thread is ready for dispatch on slice0 subslice2 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="B 3 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_thread02_ready_for_dispatch"
+             units="percent"
+             symbol_name="PSThread02ReadyForDispatch"
+             availability="$SubsliceMask 0x4 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <counter name="NonPS Thread Ready For Dispatch on Slice0 Subslice1"
+             description="The percentage of time in which non-PS thread is ready for dispatch on slice0 subslice1 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="non_ps_thread01_ready_for_dispatch"
+             units="percent"
+             symbol_name="NonPSThread01ReadyForDispatch"
+             availability="$SubsliceMask 0x2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x000000A0" />
+        <register type="NOA" address="0x00009888" value="0x12120000" />
+        <register type="NOA" address="0x00009888" value="0x12320000" />
+        <register type="NOA" address="0x00009888" value="0x12520000" />
+        <register type="NOA" address="0x00009888" value="0x002F8000" />
+        <register type="NOA" address="0x00009888" value="0x022F3000" />
+        <register type="NOA" address="0x00009888" value="0x0A4C0015" />
+        <register type="NOA" address="0x00009888" value="0x0C0D8000" />
+        <register type="NOA" address="0x00009888" value="0x0E0DA000" />
+        <register type="NOA" address="0x00009888" value="0x000D8000" />
+        <register type="NOA" address="0x00009888" value="0x020DA000" />
+        <register type="NOA" address="0x00009888" value="0x040DA000" />
+        <register type="NOA" address="0x00009888" value="0x060D2000" />
+        <register type="NOA" address="0x00009888" value="0x100F03A0" />
+        <register type="NOA" address="0x00009888" value="0x0C0FF000" />
+        <register type="NOA" address="0x00009888" value="0x0E0F0095" />
+        <register type="NOA" address="0x00009888" value="0x062C8000" />
+        <register type="NOA" address="0x00009888" value="0x082C8000" />
+        <register type="NOA" address="0x00009888" value="0x0A2C8000" />
+        <register type="NOA" address="0x00009888" value="0x0C2D8000" />
+        <register type="NOA" address="0x00009888" value="0x0E2D4000" />
+        <register type="NOA" address="0x00009888" value="0x062D4000" />
+        <register type="NOA" address="0x00009888" value="0x02108000" />
+        <register type="NOA" address="0x00009888" value="0x0410C000" />
+        <register type="NOA" address="0x00009888" value="0x02118000" />
+        <register type="NOA" address="0x00009888" value="0x0411C000" />
+        <register type="NOA" address="0x00009888" value="0x02121880" />
+        <register type="NOA" address="0x00009888" value="0x041219B5" />
+        <register type="NOA" address="0x00009888" value="0x00120000" />
+        <register type="NOA" address="0x00009888" value="0x02134000" />
+        <register type="NOA" address="0x00009888" value="0x04135000" />
+        <register type="NOA" address="0x00009888" value="0x0C308000" />
+        <register type="NOA" address="0x00009888" value="0x0E304000" />
+        <register type="NOA" address="0x00009888" value="0x06304000" />
+        <register type="NOA" address="0x00009888" value="0x0C318000" />
+        <register type="NOA" address="0x00009888" value="0x0E314000" />
+        <register type="NOA" address="0x00009888" value="0x06314000" />
+        <register type="NOA" address="0x00009888" value="0x0C321A80" />
+        <register type="NOA" address="0x00009888" value="0x0E320033" />
+        <register type="NOA" address="0x00009888" value="0x06320031" />
+        <register type="NOA" address="0x00009888" value="0x00320000" />
+        <register type="NOA" address="0x00009888" value="0x0C334000" />
+        <register type="NOA" address="0x00009888" value="0x0E331000" />
+        <register type="NOA" address="0x00009888" value="0x06331000" />
+        <register type="NOA" address="0x00009888" value="0x0E508000" />
+        <register type="NOA" address="0x00009888" value="0x00508000" />
+        <register type="NOA" address="0x00009888" value="0x02504000" />
+        <register type="NOA" address="0x00009888" value="0x0E518000" />
+        <register type="NOA" address="0x00009888" value="0x00518000" />
+        <register type="NOA" address="0x00009888" value="0x02514000" />
+        <register type="NOA" address="0x00009888" value="0x0E521880" />
+        <register type="NOA" address="0x00009888" value="0x00521A80" />
+        <register type="NOA" address="0x00009888" value="0x02520033" />
+        <register type="NOA" address="0x00009888" value="0x0E534000" />
+        <register type="NOA" address="0x00009888" value="0x00534000" />
+        <register type="NOA" address="0x00009888" value="0x02531000" />
+        <register type="NOA" address="0x00009888" value="0x1190FF80" />
+        <register type="NOA" address="0x00009888" value="0x57900000" />
+        <register type="NOA" address="0x00009888" value="0x49900800" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+        <register type="NOA" address="0x00009888" value="0x4B900062" />
+        <register type="NOA" address="0x00009888" value="0x59900000" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x41900C00" />
+        <register type="NOA" address="0x00009888" value="0x43900003" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+        <register type="NOA" address="0x00009888" value="0x45900040" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x000091BC" value="0xE0500000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002744" value="0x00800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x30800000" />
+        <register type="OA" address="0x00002770" value="0x00000002" />
+        <register type="OA" address="0x00002774" value="0x00007FFF" />
+        <register type="OA" address="0x00002778" value="0x00000000" />
+        <register type="OA" address="0x0000277C" value="0x00009FFF" />
+        <register type="OA" address="0x00002780" value="0x00000002" />
+        <register type="OA" address="0x00002784" value="0x0000EFFF" />
+        <register type="OA" address="0x00002788" value="0x00000000" />
+        <register type="OA" address="0x0000278C" value="0x0000F3FF" />
+        <register type="OA" address="0x00002790" value="0x00000002" />
+        <register type="OA" address="0x00002794" value="0x0000FDFF" />
+        <register type="OA" address="0x00002798" value="0x00000000" />
+        <register type="OA" address="0x0000279C" value="0x0000FE7F" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E758" value="0x00015014" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+        <register type="FLEX" address="0x0000E65C" value="0x00055054" />
+    </register_config>
+  </set>
+
+  <set name="Metric set TDL_2"
+       mdapi_supported_apis="VK OGL OCL IO BB"
+       underscore_name="tdl_2"
+       hw_config_guid="0a7accbf-8c55-455f-9984-23e9fb0b826d"
+       chipset="SKLGT2"
+       symbol_name="TDL_2"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SQ is full"
+             description="The percentage of time when SQ is filled above a threshold (usually 48 entries)"
+             data_type="float"
+             max_equation="100"
+             equation="PERFCNT1 READ_REG 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gt_request_queue_full"
+             units="percent"
+             symbol_name="GTRequestQueueFull"
+             availability="true $QueryMode &amp;&amp;"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL4 OCL"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on the both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Thread Header Ready on Slice0 Subslice1 Port 0"
+             description="The percentage of time in which thread header is ready on slice0 subslice1 thread dispatcher port 0"
+             data_type="float"
+             max_equation="100"
+             equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header01_ready_port0"
+             units="percent"
+             symbol_name="ThreadHeader01ReadyPort0"
+             availability="$SubsliceMask 0x2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Thread Header Ready on Slice0 Subslice1 Port 1"
+             description="The percentage of time in which thread header is ready on slice0 subslice1 thread dispatcher port 1"
+             data_type="float"
+             max_equation="100"
+             equation="C 2 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header01_ready_port1"
+             units="percent"
+             symbol_name="ThreadHeader01ReadyPort1"
+             availability="$SubsliceMask 0x2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Thread Header Ready on Slice0 Subslice2 Port 1"
+             description="The percentage of time in which thread header is ready on slice0 subslice2 thread dispatcher port 1"
+             data_type="float"
+             max_equation="100"
+             equation="C 4 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header02_ready_port1"
+             units="percent"
+             symbol_name="ThreadHeader02ReadyPort1"
+             availability="$SubsliceMask 0x4 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Thread Header Ready on Slice0 Subslice2 Port 0"
+             description="The percentage of time in which thread header is ready on slice0 subslice2 thread dispatcher port 0"
+             data_type="float"
+             max_equation="100"
+             equation="C 3 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header02_ready_port0"
+             units="percent"
+             symbol_name="ThreadHeader02ReadyPort0"
+             availability="$SubsliceMask 0x4 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="Thread Header Ready on Slice0 Subslice0 Port 0"
+             description="The percentage of time in which thread header is ready on slice0 subslice0 thread dispatcher port 0"
+             data_type="float"
+             max_equation="100"
+             equation="C 5 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header00_ready_port0"
+             units="percent"
+             symbol_name="ThreadHeader00ReadyPort0"
+             availability="$SubsliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <counter name="Thread Header Ready on Slice0 Subslice0 Port 1"
+             description="The percentage of time in which thread header is ready on slice0 subslice0 thread dispatcher port 1"
+             data_type="float"
+             max_equation="100"
+             equation="C 6 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header00_ready_port1"
+             units="percent"
+             symbol_name="ThreadHeader00ReadyPort1"
+             availability="$SubsliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x000000A0" />
+        <register type="NOA" address="0x00009888" value="0x12124D60" />
+        <register type="NOA" address="0x00009888" value="0x12322E60" />
+        <register type="NOA" address="0x00009888" value="0x12524D60" />
+        <register type="NOA" address="0x00009888" value="0x022F3000" />
+        <register type="NOA" address="0x00009888" value="0x0A4C0014" />
+        <register type="NOA" address="0x00009888" value="0x000D8000" />
+        <register type="NOA" address="0x00009888" value="0x020DA000" />
+        <register type="NOA" address="0x00009888" value="0x040DA000" />
+        <register type="NOA" address="0x00009888" value="0x060D2000" />
+        <register type="NOA" address="0x00009888" value="0x0C0FE000" />
+        <register type="NOA" address="0x00009888" value="0x0E0F0097" />
+        <register type="NOA" address="0x00009888" value="0x082C8000" />
+        <register type="NOA" address="0x00009888" value="0x0A2C8000" />
+        <register type="NOA" address="0x00009888" value="0x002D8000" />
+        <register type="NOA" address="0x00009888" value="0x062D4000" />
+        <register type="NOA" address="0x00009888" value="0x0410C000" />
+        <register type="NOA" address="0x00009888" value="0x0411C000" />
+        <register type="NOA" address="0x00009888" value="0x04121FB7" />
+        <register type="NOA" address="0x00009888" value="0x00120000" />
+        <register type="NOA" address="0x00009888" value="0x04135000" />
+        <register type="NOA" address="0x00009888" value="0x00308000" />
+        <register type="NOA" address="0x00009888" value="0x06304000" />
+        <register type="NOA" address="0x00009888" value="0x00318000" />
+        <register type="NOA" address="0x00009888" value="0x06314000" />
+        <register type="NOA" address="0x00009888" value="0x00321B80" />
+        <register type="NOA" address="0x00009888" value="0x0632003F" />
+        <register type="NOA" address="0x00009888" value="0x00334000" />
+        <register type="NOA" address="0x00009888" value="0x06331000" />
+        <register type="NOA" address="0x00009888" value="0x0250C000" />
+        <register type="NOA" address="0x00009888" value="0x0251C000" />
+        <register type="NOA" address="0x00009888" value="0x02521FB7" />
+        <register type="NOA" address="0x00009888" value="0x00520000" />
+        <register type="NOA" address="0x00009888" value="0x02535000" />
+        <register type="NOA" address="0x00009888" value="0x1190FC00" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x41900800" />
+        <register type="NOA" address="0x00009888" value="0x43900063" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+        <register type="NOA" address="0x00009888" value="0x45900040" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x000091BC" value="0xE0500000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002744" value="0x00800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x00800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E758" value="0x00015014" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+        <register type="FLEX" address="0x0000E65C" value="0x00055054" />
+    </register_config>
+  </set>
+
+  <set name="Compute Metrics Extra Gen9"
+       mdapi_supported_apis="VK OGL4 OCL IO BB"
+       underscore_name="compute_extra"
+       hw_config_guid="41a24047-7484-4ead-ae37-de907e5ff2b2"
+       chipset="SKLGT2"
+       symbol_name="ComputeExtra"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="fpu1_active"
+             units="percent"
+             symbol_name="Fpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU1 Pipe Active including Ext Math"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing including Extended Math processing"
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ  C 7 READ C 6 READ FADD C 5 READ FADD 8 FMUL FADD 100 FMUL $EuCoresTotalCount FDIV $GpuCoreClocks FDIV"
+             underscore_name="fpu1_active_adjusted"
+             units="percent"
+             symbol_name="Fpu1ActiveAdjusted"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x121203E0" />
+        <register type="NOA" address="0x00009888" value="0x123203E0" />
+        <register type="NOA" address="0x00009888" value="0x125203E0" />
+        <register type="NOA" address="0x00009888" value="0x022F4000" />
+        <register type="NOA" address="0x00009888" value="0x0A4C0040" />
+        <register type="NOA" address="0x00009888" value="0x040DA000" />
+        <register type="NOA" address="0x00009888" value="0x060D2000" />
+        <register type="NOA" address="0x00009888" value="0x0E0F006C" />
+        <register type="NOA" address="0x00009888" value="0x0C2C8000" />
+        <register type="NOA" address="0x00009888" value="0x042D8000" />
+        <register type="NOA" address="0x00009888" value="0x06104000" />
+        <register type="NOA" address="0x00009888" value="0x06114000" />
+        <register type="NOA" address="0x00009888" value="0x06120033" />
+        <register type="NOA" address="0x00009888" value="0x00120000" />
+        <register type="NOA" address="0x00009888" value="0x06131000" />
+        <register type="NOA" address="0x00009888" value="0x04308000" />
+        <register type="NOA" address="0x00009888" value="0x04318000" />
+        <register type="NOA" address="0x00009888" value="0x04321980" />
+        <register type="NOA" address="0x00009888" value="0x00320000" />
+        <register type="NOA" address="0x00009888" value="0x04334000" />
+        <register type="NOA" address="0x00009888" value="0x04504000" />
+        <register type="NOA" address="0x00009888" value="0x04514000" />
+        <register type="NOA" address="0x00009888" value="0x04520033" />
+        <register type="NOA" address="0x00009888" value="0x00520000" />
+        <register type="NOA" address="0x00009888" value="0x04531000" />
+        <register type="NOA" address="0x00009888" value="0x1190E000" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+        <register type="NOA" address="0x00009888" value="0x43900C00" />
+        <register type="NOA" address="0x00009888" value="0x45900002" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002744" value="0x00800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x00800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00001000" />
+        <register type="FLEX" address="0x0000E558" value="0x00003002" />
+        <register type="FLEX" address="0x0000E658" value="0x00005004" />
+        <register type="FLEX" address="0x0000E758" value="0x00011010" />
+        <register type="FLEX" address="0x0000E45C" value="0x00050012" />
+        <register type="FLEX" address="0x0000E55C" value="0x00052051" />
+        <register type="FLEX" address="0x0000E65C" value="0x00000008" />
+    </register_config>
+  </set>
+
+  <set name="Media Vme Pipe Gen9"
+       mdapi_supported_apis="MEDIA IO BB"
+       underscore_name="vme_pipe"
+       hw_config_guid="95910492-943f-44bd-9461-390240f243fd"
+       chipset="SKLGT2"
+       symbol_name="VMEPipe"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="EU Thread Occupancy"
+             description="The percentage of time in which hardware threads occupied EUs."
+             data_type="float"
+             max_equation="100"
+             equation="8 A 10 READ FMUL $EuThreadsCount FDIV $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_thread_occupancy"
+             units="percent"
+             symbol_name="EuThreadOccupancy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VME Busy"
+             description="The percentage of time in which VME (IME or CRE) was actively processing data."
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ B 3 READ FADD 2 FDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vme_busy"
+             units="percent"
+             symbol_name="VMEBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Overview System Batch Tier2"
+             mdapi_group="VME Pipe"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x141A5800" />
+        <register type="NOA" address="0x00009888" value="0x161A00C0" />
+        <register type="NOA" address="0x00009888" value="0x12180240" />
+        <register type="NOA" address="0x00009888" value="0x14180002" />
+        <register type="NOA" address="0x00009888" value="0x143A5800" />
+        <register type="NOA" address="0x00009888" value="0x163A00C0" />
+        <register type="NOA" address="0x00009888" value="0x12380240" />
+        <register type="NOA" address="0x00009888" value="0x14380002" />
+        <register type="NOA" address="0x00009888" value="0x002F1000" />
+        <register type="NOA" address="0x00009888" value="0x022F8000" />
+        <register type="NOA" address="0x00009888" value="0x042F3000" />
+        <register type="NOA" address="0x00009888" value="0x004C4000" />
+        <register type="NOA" address="0x00009888" value="0x0A4C1500" />
+        <register type="NOA" address="0x00009888" value="0x000D2000" />
+        <register type="NOA" address="0x00009888" value="0x060D8000" />
+        <register type="NOA" address="0x00009888" value="0x080DA000" />
+        <register type="NOA" address="0x00009888" value="0x0A0DA000" />
+        <register type="NOA" address="0x00009888" value="0x0C0DA000" />
+        <register type="NOA" address="0x00009888" value="0x0C0F0400" />
+        <register type="NOA" address="0x00009888" value="0x0E0F9500" />
+        <register type="NOA" address="0x00009888" value="0x100F002A" />
+        <register type="NOA" address="0x00009888" value="0x002C8000" />
+        <register type="NOA" address="0x00009888" value="0x0E2C8000" />
+        <register type="NOA" address="0x00009888" value="0x162C0A00" />
+        <register type="NOA" address="0x00009888" value="0x0A2DC000" />
+        <register type="NOA" address="0x00009888" value="0x0C2DC000" />
+        <register type="NOA" address="0x00009888" value="0x04193000" />
+        <register type="NOA" address="0x00009888" value="0x081A28C1" />
+        <register type="NOA" address="0x00009888" value="0x001A0000" />
+        <register type="NOA" address="0x00009888" value="0x00133000" />
+        <register type="NOA" address="0x00009888" value="0x0613C000" />
+        <register type="NOA" address="0x00009888" value="0x0813F000" />
+        <register type="NOA" address="0x00009888" value="0x00172000" />
+        <register type="NOA" address="0x00009888" value="0x06178000" />
+        <register type="NOA" address="0x00009888" value="0x0817A000" />
+        <register type="NOA" address="0x00009888" value="0x00180037" />
+        <register type="NOA" address="0x00009888" value="0x06180940" />
+        <register type="NOA" address="0x00009888" value="0x08180000" />
+        <register type="NOA" address="0x00009888" value="0x02180000" />
+        <register type="NOA" address="0x00009888" value="0x04183000" />
+        <register type="NOA" address="0x00009888" value="0x06393000" />
+        <register type="NOA" address="0x00009888" value="0x0C3A28C1" />
+        <register type="NOA" address="0x00009888" value="0x003A0000" />
+        <register type="NOA" address="0x00009888" value="0x0A33F000" />
+        <register type="NOA" address="0x00009888" value="0x0C33F000" />
+        <register type="NOA" address="0x00009888" value="0x0A37A000" />
+        <register type="NOA" address="0x00009888" value="0x0C37A000" />
+        <register type="NOA" address="0x00009888" value="0x0A380977" />
+        <register type="NOA" address="0x00009888" value="0x08380000" />
+        <register type="NOA" address="0x00009888" value="0x04380000" />
+        <register type="NOA" address="0x00009888" value="0x06383000" />
+        <register type="NOA" address="0x00009888" value="0x119000FF" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x41900040" />
+        <register type="NOA" address="0x00009888" value="0x55900000" />
+        <register type="NOA" address="0x00009888" value="0x45900800" />
+        <register type="NOA" address="0x00009888" value="0x47901000" />
+        <register type="NOA" address="0x00009888" value="0x57900000" />
+        <register type="NOA" address="0x00009888" value="0x49900844" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x30800000" />
+        <register type="OA" address="0x00002770" value="0x00100030" />
+        <register type="OA" address="0x00002774" value="0x0000FFF9" />
+        <register type="OA" address="0x00002778" value="0x00000002" />
+        <register type="OA" address="0x0000277C" value="0x0000FFFC" />
+        <register type="OA" address="0x00002780" value="0x00000002" />
+        <register type="OA" address="0x00002784" value="0x0000FFF3" />
+        <register type="OA" address="0x00002788" value="0x00100180" />
+        <register type="OA" address="0x0000278C" value="0x0000FFCF" />
+        <register type="OA" address="0x00002790" value="0x00000002" />
+        <register type="OA" address="0x00002794" value="0x0000FFCF" />
+        <register type="OA" address="0x00002798" value="0x00000002" />
+        <register type="OA" address="0x0000279C" value="0x0000FF3F" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00008003" />
+    </register_config>
+  </set>
+
+  <set name="Gpu Rings Busyness"
+       mdapi_supported_apis="VK OGL OCL MEDIA IO BB"
+       underscore_name="gpu_busyness"
+       hw_config_guid="c44a5cf7-886d-477b-bebd-2d738923e4c3"
+       chipset="SKLGT2"
+       symbol_name="GpuBusyness"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="Vebox Ring Busy"
+             description="The percentage of time when vebox command streamer was busy."
+             data_type="float"
+             max_equation="100"
+             equation="C 5 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vebox_busy"
+             units="percent"
+             symbol_name="VeboxBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="System Frame Batch"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Render Ring Busy"
+             description="The percentage of time when render command streamer was busy."
+             data_type="float"
+             max_equation="100"
+             equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="render_busy"
+             units="percent"
+             symbol_name="RenderBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="System Frame Batch"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Vdbox0 Ring Busy"
+             description="The percentage of time when Vdbox0 command streamer was busy."
+             data_type="float"
+             max_equation="100"
+             equation="C 6 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vdbox0_busy"
+             units="percent"
+             symbol_name="Vdbox0Busy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="System Frame Batch"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Blitter Ring Busy"
+             description="The percentage of time when blitter command streamer was busy."
+             data_type="float"
+             max_equation="100"
+             equation="C 4 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="blitter_busy"
+             units="percent"
+             symbol_name="BlitterBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="System Frame Batch"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="AnyRingBusy"
+             description="The percentage of time when any command streamer was busy."
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="any_ring_busy"
+             units="percent"
+             symbol_name="AnyRingBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x13805800" />
+        <register type="NOA" address="0x00009888" value="0x05962C00" />
+        <register type="NOA" address="0x00009888" value="0x19950016" />
+        <register type="NOA" address="0x00009888" value="0x21C05800" />
+        <register type="NOA" address="0x00009888" value="0x07800035" />
+        <register type="NOA" address="0x00009888" value="0x11800000" />
+        <register type="NOA" address="0x00009888" value="0x1D810400" />
+        <register type="NOA" address="0x00009888" value="0x07960025" />
+        <register type="NOA" address="0x00009888" value="0x21960000" />
+        <register type="NOA" address="0x00009888" value="0x0B964000" />
+        <register type="NOA" address="0x00009888" value="0x1B930062" />
+        <register type="NOA" address="0x00009888" value="0x17948000" />
+        <register type="NOA" address="0x00009888" value="0x1B940008" />
+        <register type="NOA" address="0x00009888" value="0x05950075" />
+        <register type="NOA" address="0x00009888" value="0x1D950000" />
+        <register type="NOA" address="0x00009888" value="0x07E54000" />
+        <register type="NOA" address="0x00009888" value="0x09924000" />
+        <register type="NOA" address="0x00009888" value="0x05982000" />
+        <register type="NOA" address="0x00009888" value="0x19908000" />
+        <register type="NOA" address="0x00009888" value="0x1B904000" />
+        <register type="NOA" address="0x00009888" value="0x1D908000" />
+        <register type="NOA" address="0x00009888" value="0x1F908000" />
+        <register type="NOA" address="0x00009888" value="0x09978000" />
+        <register type="NOA" address="0x00009888" value="0x0BC000A5" />
+        <register type="NOA" address="0x00009888" value="0x11C00000" />
+        <register type="NOA" address="0x00009888" value="0x05C00000" />
+        <register type="NOA" address="0x00009888" value="0x0BC54000" />
+        <register type="NOA" address="0x00009888" value="0x11900000" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+        <register type="NOA" address="0x00009888" value="0x43900C60" />
+        <register type="NOA" address="0x00009888" value="0x45900040" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x10800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+        <register type="OA" address="0x00002770" value="0x00078000" />
+        <register type="OA" address="0x00002774" value="0x00000FFF" />
+    </register_config>
+  </set>
+
+  <set name="FF Bottlenecks"
+       mdapi_supported_apis="VK OGL OCL IO BB"
+       underscore_name="ff_bottlenecks"
+       hw_config_guid="e0b2aae4-9b8f-4211-8df0-f8e8cb203209"
+       chipset="SKLGT2"
+       symbol_name="FfBottlenecks"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS is sending vertices to CL"
+             description="The percentage of time in which VS is sending vertices to CL bypassing other pipeline stages."
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ B 4 READ FADD 2 FDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_cl_bypass"
+             units="percent"
+             symbol_name="VsClBypass"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw Tier3"
+             mdapi_group="3D Pipe/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 14 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="HS Bottleneck"
+             low_watermark="3"
+             description="The percentage of time in which hull shader pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="9"
+             equation="B 3 READ 100 UMUL $GpuCoreClocks FDIV"
+             max_equation="100"
+             underscore_name="hs_bottleneck"
+             units="percent"
+             symbol_name="HsBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Hull Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 13 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="DS Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which domain shader pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="15"
+             equation="B 1 READ B 5 READ FADD 2 FDIV 100 UMUL $GpuCoreClocks FDIV"
+             max_equation="100"
+             underscore_name="ds_bottleneck"
+             units="percent"
+             symbol_name="DsBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Domain Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="TE Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which tessellation pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="15"
+             equation="B 2 READ B 6 READ FADD 2 FDIV 100 UMUL $GpuCoreClocks FDIV"
+             max_equation="100"
+             underscore_name="te_bottleneck"
+             units="percent"
+             symbol_name="TeBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Geometry Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="GS Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which geometry shader pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="15"
+             equation="B 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             max_equation="100"
+             underscore_name="gs_bottleneck"
+             units="percent"
+             symbol_name="GsBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Geometry Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="EU Thread Occupancy"
+             description="The percentage of time in which hardware threads occupied EUs."
+             data_type="float"
+             max_equation="100"
+             equation="8 A 17 READ FMUL $EuThreadsCount FDIV $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_thread_occupancy"
+             units="percent"
+             symbol_name="EuThreadOccupancy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x11850019" />
+        <register type="NOA" address="0x00009888" value="0x11860007" />
+        <register type="NOA" address="0x00009888" value="0x19867C00" />
+        <register type="NOA" address="0x00009888" value="0x01870000" />
+        <register type="NOA" address="0x00009888" value="0x15880000" />
+        <register type="NOA" address="0x00009888" value="0x01898000" />
+        <register type="NOA" address="0x00009888" value="0x0B898000" />
+        <register type="NOA" address="0x00009888" value="0x0D890C00" />
+        <register type="NOA" address="0x00009888" value="0x0D808000" />
+        <register type="NOA" address="0x00009888" value="0x118A8000" />
+        <register type="NOA" address="0x00009888" value="0x1B8A2000" />
+        <register type="NOA" address="0x00009888" value="0x1D8A0003" />
+        <register type="NOA" address="0x00009888" value="0x1F810002" />
+        <register type="NOA" address="0x00009888" value="0x0982C000" />
+        <register type="NOA" address="0x00009888" value="0x0D824000" />
+        <register type="NOA" address="0x00009888" value="0x05833000" />
+        <register type="NOA" address="0x00009888" value="0x07831000" />
+        <register type="NOA" address="0x00009888" value="0x0D848000" />
+        <register type="NOA" address="0x00009888" value="0x0D850080" />
+        <register type="NOA" address="0x00009888" value="0x01850000" />
+        <register type="NOA" address="0x00009888" value="0x09860080" />
+        <register type="NOA" address="0x00009888" value="0x0D860080" />
+        <register type="NOA" address="0x00009888" value="0x07870C80" />
+        <register type="NOA" address="0x00009888" value="0x0B870C80" />
+        <register type="NOA" address="0x00009888" value="0x01880032" />
+        <register type="NOA" address="0x00009888" value="0x0B888032" />
+        <register type="NOA" address="0x00009888" value="0x11880000" />
+        <register type="NOA" address="0x00009888" value="0x07888000" />
+        <register type="NOA" address="0x00009888" value="0x1D930010" />
+        <register type="NOA" address="0x00009888" value="0x1D950013" />
+        <register type="NOA" address="0x00009888" value="0x0DE58000" />
+        <register type="NOA" address="0x00009888" value="0x05924000" />
+        <register type="NOA" address="0x00009888" value="0x0B928000" />
+        <register type="NOA" address="0x00009888" value="0x0D92C000" />
+        <register type="NOA" address="0x00009888" value="0x0F92C000" />
+        <register type="NOA" address="0x00009888" value="0x11928000" />
+        <register type="NOA" address="0x00009888" value="0x01981000" />
+        <register type="NOA" address="0x00009888" value="0x07984000" />
+        <register type="NOA" address="0x00009888" value="0x0998A000" />
+        <register type="NOA" address="0x00009888" value="0x0B985000" />
+        <register type="NOA" address="0x00009888" value="0x0D982000" />
+        <register type="NOA" address="0x00009888" value="0x13904000" />
+        <register type="NOA" address="0x00009888" value="0x21904000" />
+        <register type="NOA" address="0x00009888" value="0x23904000" />
+        <register type="NOA" address="0x00009888" value="0x25904000" />
+        <register type="NOA" address="0x00009888" value="0x27904000" />
+        <register type="NOA" address="0x00009888" value="0x29904000" />
+        <register type="NOA" address="0x00009888" value="0x2B904000" />
+        <register type="NOA" address="0x00009888" value="0x2D908000" />
+        <register type="NOA" address="0x00009888" value="0x11900000" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x41900020" />
+        <register type="NOA" address="0x00009888" value="0x55900000" />
+        <register type="NOA" address="0x00009888" value="0x45900000" />
+        <register type="NOA" address="0x00009888" value="0x47900400" />
+        <register type="NOA" address="0x00009888" value="0x57900000" />
+        <register type="NOA" address="0x00009888" value="0x49900000" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x00800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00000011" />
+        <register type="FLEX" address="0x0000E758" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00000008" />
+    </register_config>
+  </set>
+
+  <set name="MDAPI testing set Gen9"
+       mdapi_supported_apis="VK OGL OCL IO BB"
+       underscore_name="test_oa"
+       hw_config_guid="1651949f-0ac0-4cb1-a06f-dafd74a407d1"
+       chipset="SKLGT2"
+       symbol_name="TestOa"
+       >
+    <counter name="TestCounter7"
+             description="HW test counter 7. Factor: 0.666"
+             data_type="uint64"
+             equation="B 7 READ"
+             underscore_name="counter7"
+             units="events"
+             symbol_name="Counter7"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="TestCounter8"
+             description="HW test counter 8. Should be equal to 1."
+             data_type="uint64"
+             equation="C 7 READ"
+             underscore_name="counter8"
+             units="events"
+             symbol_name="Counter8"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="TestCounter4"
+             description="HW test counter 4. Factor: 0.333"
+             data_type="uint64"
+             equation="B 4 READ"
+             underscore_name="counter4"
+             units="events"
+             symbol_name="Counter4"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="TestCounter5"
+             description="HW test counter 5. Factor: 0.333"
+             data_type="uint64"
+             equation="B 5 READ"
+             underscore_name="counter5"
+             units="events"
+             symbol_name="Counter5"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="TestCounter6"
+             description="HW test counter 6. Factor: 0.166"
+             data_type="uint64"
+             equation="B 6 READ"
+             underscore_name="counter6"
+             units="events"
+             symbol_name="Counter6"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="TestCounter3"
+             description="HW test counter 3. Factor: 0.5"
+             data_type="uint64"
+             equation="B 3 READ"
+             underscore_name="counter3"
+             units="events"
+             symbol_name="Counter3"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="TestCounter0"
+             description="HW test counter 0. Factor: 0.0"
+             data_type="uint64"
+             equation="B 0 READ"
+             underscore_name="counter0"
+             units="events"
+             symbol_name="Counter0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="TestCounter1"
+             description="HW test counter 1. Factor: 1.0"
+             data_type="uint64"
+             equation="B 1 READ"
+             underscore_name="counter1"
+             units="events"
+             symbol_name="Counter1"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="TestCounter2"
+             description="HW test counter 2. Factor: 1.0"
+             data_type="uint64"
+             equation="B 2 READ"
+             underscore_name="counter2"
+             units="events"
+             symbol_name="Counter2"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x11810000" />
+        <register type="NOA" address="0x00009888" value="0x07810016" />
+        <register type="NOA" address="0x00009888" value="0x1F810000" />
+        <register type="NOA" address="0x00009888" value="0x1D810000" />
+        <register type="NOA" address="0x00009888" value="0x1B930040" />
+        <register type="NOA" address="0x00009888" value="0x07E54000" />
+        <register type="NOA" address="0x00009888" value="0x1F908000" />
+        <register type="NOA" address="0x00009888" value="0x11900000" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+        <register type="NOA" address="0x00009888" value="0x45900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002770" value="0x00000004" />
+        <register type="OA" address="0x00002774" value="0x00000000" />
+        <register type="OA" address="0x00002778" value="0x00000003" />
+        <register type="OA" address="0x0000277C" value="0x00000000" />
+        <register type="OA" address="0x00002780" value="0x00000007" />
+        <register type="OA" address="0x00002784" value="0x00000000" />
+        <register type="OA" address="0x00002788" value="0x00100002" />
+        <register type="OA" address="0x0000278C" value="0x0000FFF7" />
+        <register type="OA" address="0x00002790" value="0x00100002" />
+        <register type="OA" address="0x00002794" value="0x0000FFCF" />
+        <register type="OA" address="0x00002798" value="0x00100082" />
+        <register type="OA" address="0x0000279C" value="0x0000FFEF" />
+        <register type="OA" address="0x000027A0" value="0x001000C2" />
+        <register type="OA" address="0x000027A4" value="0x0000FFE7" />
+        <register type="OA" address="0x000027A8" value="0x00100001" />
+        <register type="OA" address="0x000027AC" value="0x0000FFE7" />
+    </register_config>
+  </set>
+
+  <set name="Metric set PMA Stall"
+       mdapi_supported_apis="VK OGL OGL4 OCL IO MEDIA"
+       underscore_name="pma__stall"
+       hw_config_guid="27871149-2fa9-40ba-aa73-350d60c03a09"
+       chipset="SKLGT2"
+       symbol_name="PMA_Stall"
+       >
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="STC PMA stall"
+             description="Percentage of time when stencil cache line and an overlapping pixel are causing stalls"
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ B 1 READ FADD 2 FDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="stc_pma_stall"
+             units="percent"
+             symbol_name="StcPMAStall"
+             availability="$SliceMask 1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_group="GPU/Stencil Cache"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x122D3080" />
+        <register type="NOA" address="0x00009888" value="0x000D2000" />
+        <register type="NOA" address="0x00009888" value="0x060D8000" />
+        <register type="NOA" address="0x00009888" value="0x080DA000" />
+        <register type="NOA" address="0x00009888" value="0x0A0DA000" />
+        <register type="NOA" address="0x00009888" value="0x0C0F0800" />
+        <register type="NOA" address="0x00009888" value="0x0E0FAA00" />
+        <register type="NOA" address="0x00009888" value="0x100F0002" />
+        <register type="NOA" address="0x00009888" value="0x002D0025" />
+        <register type="NOA" address="0x00009888" value="0x062D1300" />
+        <register type="NOA" address="0x00009888" value="0x082D16A4" />
+        <register type="NOA" address="0x00009888" value="0x0A2D162E" />
+        <register type="NOA" address="0x00009888" value="0x102D0000" />
+        <register type="NOA" address="0x00009888" value="0x1190003F" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x41900000" />
+        <register type="NOA" address="0x00009888" value="0x55900000" />
+        <register type="NOA" address="0x00009888" value="0x45900000" />
+        <register type="NOA" address="0x00009888" value="0x47900000" />
+        <register type="NOA" address="0x00009888" value="0x57900000" />
+        <register type="NOA" address="0x00009888" value="0x49900000" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x30800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+        <register type="OA" address="0x00002770" value="0x00E00021" />
+        <register type="OA" address="0x00002774" value="0x0007FFF8" />
+        <register type="OA" address="0x00002778" value="0x07000101" />
+        <register type="OA" address="0x0000277C" value="0x0038FFC7" />
+    </register_config>
+  </set>
+
+</metrics>
diff --git a/lib/i915/perf-configs/oa-sklgt3.xml b/lib/i915/perf-configs/oa-sklgt3.xml
new file mode 100644
index 00000000..1b511729
--- /dev/null
+++ b/lib/i915/perf-configs/oa-sklgt3.xml
@@ -0,0 +1,10933 @@
+<?xml version="1.0"?>
+<metrics version="1581935518" merge_md5="">
+  <set name="Render Metrics Basic Gen9"
+       mdapi_supported_apis="VK OGL OCL IO BB"
+       underscore_name="render_basic"
+       hw_config_guid="21fef15a-83f4-4ffa-bb81-7da6e38b8e4b"
+       chipset="SKLGT3"
+       symbol_name="RenderBasic"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Misses"
+             description="The total number of L3 misses."
+             data_type="uint64"
+             equation="C 4 READ"
+             underscore_name="l3_misses"
+             units="messages"
+             symbol_name="L3Misses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/TAG"
+             />
+    <counter name="GTI L3 Throughput"
+             description="The total number of GPU memory bytes transferred between L3 caches and GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="$L3Misses 64 UMUL"
+             underscore_name="gti_l3_throughput"
+             units="bytes"
+             symbol_name="GtiL3Throughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Cache Misses"
+             description="The total number of sampler cache misses in all LODs in all sampler units."
+             data_type="uint64"
+             equation="B 4 READ B 5 READ UADD 8 UMUL"
+             underscore_name="sampler_l1_misses"
+             units="messages"
+             symbol_name="SamplerL1Misses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler 1 Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which Sampler 1 has been slowing down the pipe when processing EU requests."
+             data_type="float"
+             high_watermark="15"
+             equation="B 3 READ 100 UMUL $GpuCoreClocks FDIV"
+             max_equation="100"
+             underscore_name="sampler1_bottleneck"
+             units="percent"
+             symbol_name="Sampler1Bottleneck"
+             availability="$SubsliceMask 0x12 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="L3 Sampler Throughput"
+             description="The total number of GPU memory bytes transferred between samplers and L3 caches."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="$SamplerL1Misses 64 UMUL"
+             underscore_name="l3_sampler_throughput"
+             units="bytes"
+             symbol_name="L3SamplerThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Sampler"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on the both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Sampler 0 Busy"
+             description="The percentage of time in which Sampler 0 has been processing EU requests."
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler0_busy"
+             units="percent"
+             symbol_name="Sampler0Busy"
+             availability="$SubsliceMask 0x09 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_group="Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Sampler 1 Busy"
+             description="The percentage of time in which Sampler 1 has been processing EU requests."
+             data_type="float"
+             max_equation="100"
+             equation="B 1 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler1_busy"
+             units="percent"
+             symbol_name="Sampler1Busy"
+             availability="$SubsliceMask 0x12 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_group="Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Samplers Busy"
+             description="The percentage of time in which samplers have been processing EU requests."
+             data_type="float"
+             max_equation="100"
+             equation="$Sampler0Busy $Sampler1Busy FMAX"
+             underscore_name="samplers_busy"
+             units="percent"
+             symbol_name="SamplersBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="Sampler"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="GTI Fixed Pipe Throughput"
+             description="The total number of GPU memory bytes transferred between 3D Pipeline (Command Dispatch, Input Assembly and Stream Output) and GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL"
+             equation="B 6 READ B 7 READ UADD 64 UMUL"
+             underscore_name="gti_vf_throughput"
+             units="bytes"
+             symbol_name="GtiVfThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="GTI/3D Pipe"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler 0 Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which Sampler 0 has been slowing down the pipe when processing EU requests."
+             data_type="float"
+             high_watermark="15"
+             equation="B 2 READ 100 UMUL $GpuCoreClocks FDIV"
+             max_equation="100"
+             underscore_name="sampler0_bottleneck"
+             units="percent"
+             symbol_name="Sampler0Bottleneck"
+             availability="$SubsliceMask 0x09 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="L3 Lookup Accesses w/o IC"
+             description="The total number of L3 cache lookup accesses w/o IC."
+             data_type="uint64"
+             equation="$SamplerL1Misses $ShaderMemoryAccesses UADD"
+             underscore_name="l3_lookups"
+             units="messages"
+             symbol_name="L3Lookups"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/TAG"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GTI Read Throughput"
+             description="The total number of GPU memory bytes read from GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL"
+             equation="C 6 READ 64 UMUL"
+             underscore_name="gti_read_throughput"
+             units="bytes"
+             symbol_name="GtiReadThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GTI Depth Throughput"
+             description="The total number of GPU memory bytes transferred between depth caches and GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="C 0 READ C 1 READ UADD 64 UMUL"
+             underscore_name="gti_depth_throughput"
+             units="bytes"
+             symbol_name="GtiDepthThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="GTI/Depth Cache"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Samplers Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which samplers have been slowing down the pipe when processing EU requests."
+             data_type="float"
+             high_watermark="15"
+             equation="$Sampler0Bottleneck $Sampler1Bottleneck FMAX"
+             max_equation="100"
+             underscore_name="sampler_bottleneck"
+             units="percent"
+             symbol_name="SamplerBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Indicate System Frame Batch Draw"
+             mdapi_group="Sampler"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="GTI HDC TLB Lookup Throughput"
+             description="The total number of GPU memory bytes transferred between GTI and HDC, when HDC is doing TLB lookups."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="C 5 READ 64 UMUL"
+             underscore_name="gti_hdc_lookups_throughput"
+             units="bytes"
+             symbol_name="GtiHdcLookupsThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GTI RCC Throughput"
+             description="The total number of GPU memory bytes transferred between render color caches and GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="C 2 READ C 3 READ UADD 64 UMUL"
+             underscore_name="gti_rcc_throughput"
+             units="bytes"
+             symbol_name="GtiRccThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="GTI/Color Cache"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="GTI Write Throughput"
+             description="The total number of GPU memory bytes written to GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 32 UMUL"
+             equation="C 7 READ 64 UMUL"
+             underscore_name="gti_write_throughput"
+             units="bytes"
+             symbol_name="GtiWriteThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x166C01E0" />
+        <register type="NOA" address="0x00009888" value="0x12170280" />
+        <register type="NOA" address="0x00009888" value="0x12370280" />
+        <register type="NOA" address="0x00009888" value="0x16EC01E0" />
+        <register type="NOA" address="0x00009888" value="0x11930317" />
+        <register type="NOA" address="0x00009888" value="0x159303DF" />
+        <register type="NOA" address="0x00009888" value="0x3F900003" />
+        <register type="NOA" address="0x00009888" value="0x1A4E0380" />
+        <register type="NOA" address="0x00009888" value="0x0A6C0053" />
+        <register type="NOA" address="0x00009888" value="0x106C0000" />
+        <register type="NOA" address="0x00009888" value="0x1C6C0000" />
+        <register type="NOA" address="0x00009888" value="0x0A1B4000" />
+        <register type="NOA" address="0x00009888" value="0x1C1C0001" />
+        <register type="NOA" address="0x00009888" value="0x002F1000" />
+        <register type="NOA" address="0x00009888" value="0x042F1000" />
+        <register type="NOA" address="0x00009888" value="0x004C4000" />
+        <register type="NOA" address="0x00009888" value="0x0A4C8400" />
+        <register type="NOA" address="0x00009888" value="0x0C4C0002" />
+        <register type="NOA" address="0x00009888" value="0x000D2000" />
+        <register type="NOA" address="0x00009888" value="0x060D8000" />
+        <register type="NOA" address="0x00009888" value="0x080DA000" />
+        <register type="NOA" address="0x00009888" value="0x0A0DA000" />
+        <register type="NOA" address="0x00009888" value="0x0C0F0400" />
+        <register type="NOA" address="0x00009888" value="0x0E0F6600" />
+        <register type="NOA" address="0x00009888" value="0x100F0001" />
+        <register type="NOA" address="0x00009888" value="0x002C8000" />
+        <register type="NOA" address="0x00009888" value="0x162CA200" />
+        <register type="NOA" address="0x00009888" value="0x062D8000" />
+        <register type="NOA" address="0x00009888" value="0x082D8000" />
+        <register type="NOA" address="0x00009888" value="0x00133000" />
+        <register type="NOA" address="0x00009888" value="0x08133000" />
+        <register type="NOA" address="0x00009888" value="0x00170020" />
+        <register type="NOA" address="0x00009888" value="0x08170021" />
+        <register type="NOA" address="0x00009888" value="0x10170000" />
+        <register type="NOA" address="0x00009888" value="0x0633C000" />
+        <register type="NOA" address="0x00009888" value="0x0833C000" />
+        <register type="NOA" address="0x00009888" value="0x06370800" />
+        <register type="NOA" address="0x00009888" value="0x08370840" />
+        <register type="NOA" address="0x00009888" value="0x10370000" />
+        <register type="NOA" address="0x00009888" value="0x1ACE0200" />
+        <register type="NOA" address="0x00009888" value="0x0AEC5300" />
+        <register type="NOA" address="0x00009888" value="0x10EC0000" />
+        <register type="NOA" address="0x00009888" value="0x1CEC0000" />
+        <register type="NOA" address="0x00009888" value="0x0A9B8000" />
+        <register type="NOA" address="0x00009888" value="0x1C9C0002" />
+        <register type="NOA" address="0x00009888" value="0x0CCC0002" />
+        <register type="NOA" address="0x00009888" value="0x0A8D8000" />
+        <register type="NOA" address="0x00009888" value="0x108F0001" />
+        <register type="NOA" address="0x00009888" value="0x16AC8000" />
+        <register type="NOA" address="0x00009888" value="0x0D933031" />
+        <register type="NOA" address="0x00009888" value="0x0F933E3F" />
+        <register type="NOA" address="0x00009888" value="0x01933D00" />
+        <register type="NOA" address="0x00009888" value="0x0393073C" />
+        <register type="NOA" address="0x00009888" value="0x0593000E" />
+        <register type="NOA" address="0x00009888" value="0x1D930000" />
+        <register type="NOA" address="0x00009888" value="0x19930000" />
+        <register type="NOA" address="0x00009888" value="0x1B930000" />
+        <register type="NOA" address="0x00009888" value="0x1D900157" />
+        <register type="NOA" address="0x00009888" value="0x1F900158" />
+        <register type="NOA" address="0x00009888" value="0x35900000" />
+        <register type="NOA" address="0x00009888" value="0x2B908000" />
+        <register type="NOA" address="0x00009888" value="0x2D908000" />
+        <register type="NOA" address="0x00009888" value="0x2F908000" />
+        <register type="NOA" address="0x00009888" value="0x31908000" />
+        <register type="NOA" address="0x00009888" value="0x15908000" />
+        <register type="NOA" address="0x00009888" value="0x17908000" />
+        <register type="NOA" address="0x00009888" value="0x19908000" />
+        <register type="NOA" address="0x00009888" value="0x1B908000" />
+        <register type="NOA" address="0x00009888" value="0x1190003F" />
+        <register type="NOA" address="0x00009888" value="0x51907710" />
+        <register type="NOA" address="0x00009888" value="0x419020A0" />
+        <register type="NOA" address="0x00009888" value="0x55901515" />
+        <register type="NOA" address="0x00009888" value="0x45900529" />
+        <register type="NOA" address="0x00009888" value="0x47901025" />
+        <register type="NOA" address="0x00009888" value="0x57907770" />
+        <register type="NOA" address="0x00009888" value="0x49902100" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+        <register type="NOA" address="0x00009888" value="0x4B900108" />
+        <register type="NOA" address="0x00009888" value="0x59900007" />
+        <register type="NOA" address="0x00009888" value="0x43902108" />
+        <register type="NOA" address="0x00009888" value="0x53907777" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x00800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+        <register type="OA" address="0x00002740" value="0x00000000" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E758" value="0x00015014" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+        <register type="FLEX" address="0x0000E65C" value="0x00222222" />
+    </register_config>
+  </set>
+
+  <set name="Compute Metrics Basic Gen9"
+       mdapi_supported_apis="VK OGL4 OCL IO BB"
+       underscore_name="compute_basic"
+       hw_config_guid="4320492b-fd03-42ac-922f-dbe1ef3b7b58"
+       chipset="SKLGT3"
+       symbol_name="ComputeBasic"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Untyped Bytes Read"
+             description="The total number of untyped memory bytes read via Data Port."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="B 6 READ B 7 READ C 0 READ UADD UADD $EuSlicesTotalCount 64 UMUL UMUL"
+             underscore_name="untyped_bytes_read"
+             units="bytes"
+             symbol_name="UntypedBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Typed Bytes Written"
+             description="The total number of typed memory bytes written via Data Port."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="B 3 READ B 4 READ B 5 READ UADD UADD $EuSlicesTotalCount 64 UMUL UMUL"
+             underscore_name="typed_bytes_written"
+             units="bytes"
+             symbol_name="TypedBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="fpu0_active"
+             units="percent"
+             symbol_name="Fpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="fpu1_active"
+             units="percent"
+             symbol_name="Fpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO OCL BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU AVG IPC Rate"
+             description="The average rate of IPC calculated for 2 FPU pipelines."
+             data_type="float"
+             max_equation="2"
+             equation="A 9 READ  A 10 READ  A 11 READ UADD  A 9 READ USUB FDIV 1 FADD"
+             underscore_name="eu_avg_ipc_rate"
+             units="number"
+             symbol_name="EuAvgIpcRate"
+             semantic_type="ratio"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier4 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO OCL BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO OCL BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texel lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GTI Read Throughput"
+             description="The total number of GPU memory bytes read from GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="C 4 READ 64 UMUL"
+             underscore_name="gti_read_throughput"
+             units="bytes"
+             symbol_name="GtiReadThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Untyped Writes"
+             description="The total number of untyped memory bytes written via Data Port."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="C 1 READ C 2 READ C 3 READ UADD UADD $EuSlicesTotalCount 64 UMUL UMUL"
+             underscore_name="untyped_bytes_written"
+             units="bytes"
+             symbol_name="UntypedBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO OCL BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="Typed Bytes Read"
+             description="The total number of typed memory bytes read via Data Port."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="B 0 READ B 1 READ B 2 READ UADD UADD $EuSlicesTotalCount 64 UMUL UMUL"
+             underscore_name="typed_bytes_read"
+             units="bytes"
+             symbol_name="TypedBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="EU Thread Occupancy"
+             description="The percentage of time in which hardware threads occupied EUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 13 READ 8 UMUL $EuCoresTotalCount UDIV $EuThreadsCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_thread_occupancy"
+             units="percent"
+             symbol_name="EuThreadOccupancy"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO OCL BB"
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO OCL BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO OCL BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="GTI Write Throughput"
+             description="The total number of GPU memory bytes written to GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 32 UMUL"
+             equation="C 5 READ 64 UMUL"
+             underscore_name="gti_write_throughput"
+             units="bytes"
+             symbol_name="GtiWriteThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO OCL BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO OCL BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <counter name="EU Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_send_active"
+             units="percent"
+             symbol_name="EuSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO OCL BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x104F00E0" />
+        <register type="NOA" address="0x00009888" value="0x124F1C00" />
+        <register type="NOA" address="0x00009888" value="0x106C00E0" />
+        <register type="NOA" address="0x00009888" value="0x37906800" />
+        <register type="NOA" address="0x00009888" value="0x3F900003" />
+        <register type="NOA" address="0x00009888" value="0x004E8000" />
+        <register type="NOA" address="0x00009888" value="0x1A4E0820" />
+        <register type="NOA" address="0x00009888" value="0x1C4E0002" />
+        <register type="NOA" address="0x00009888" value="0x064F0900" />
+        <register type="NOA" address="0x00009888" value="0x084F0032" />
+        <register type="NOA" address="0x00009888" value="0x0A4F1891" />
+        <register type="NOA" address="0x00009888" value="0x0C4F0E00" />
+        <register type="NOA" address="0x00009888" value="0x0E4F003C" />
+        <register type="NOA" address="0x00009888" value="0x004F0D80" />
+        <register type="NOA" address="0x00009888" value="0x024F003B" />
+        <register type="NOA" address="0x00009888" value="0x006C0002" />
+        <register type="NOA" address="0x00009888" value="0x086C0100" />
+        <register type="NOA" address="0x00009888" value="0x0C6C000C" />
+        <register type="NOA" address="0x00009888" value="0x0E6C0B00" />
+        <register type="NOA" address="0x00009888" value="0x186C0000" />
+        <register type="NOA" address="0x00009888" value="0x1C6C0000" />
+        <register type="NOA" address="0x00009888" value="0x1E6C0000" />
+        <register type="NOA" address="0x00009888" value="0x001B4000" />
+        <register type="NOA" address="0x00009888" value="0x081B8000" />
+        <register type="NOA" address="0x00009888" value="0x0C1B4000" />
+        <register type="NOA" address="0x00009888" value="0x0E1B8000" />
+        <register type="NOA" address="0x00009888" value="0x101C8000" />
+        <register type="NOA" address="0x00009888" value="0x1A1C8000" />
+        <register type="NOA" address="0x00009888" value="0x1C1C0024" />
+        <register type="NOA" address="0x00009888" value="0x065B8000" />
+        <register type="NOA" address="0x00009888" value="0x085B4000" />
+        <register type="NOA" address="0x00009888" value="0x0A5BC000" />
+        <register type="NOA" address="0x00009888" value="0x0C5B8000" />
+        <register type="NOA" address="0x00009888" value="0x0E5B4000" />
+        <register type="NOA" address="0x00009888" value="0x005B8000" />
+        <register type="NOA" address="0x00009888" value="0x025B4000" />
+        <register type="NOA" address="0x00009888" value="0x1A5C6000" />
+        <register type="NOA" address="0x00009888" value="0x1C5C001B" />
+        <register type="NOA" address="0x00009888" value="0x125C8000" />
+        <register type="NOA" address="0x00009888" value="0x145C8000" />
+        <register type="NOA" address="0x00009888" value="0x004C8000" />
+        <register type="NOA" address="0x00009888" value="0x0A4C2000" />
+        <register type="NOA" address="0x00009888" value="0x0C4C0208" />
+        <register type="NOA" address="0x00009888" value="0x000DA000" />
+        <register type="NOA" address="0x00009888" value="0x060D8000" />
+        <register type="NOA" address="0x00009888" value="0x080DA000" />
+        <register type="NOA" address="0x00009888" value="0x0A0DA000" />
+        <register type="NOA" address="0x00009888" value="0x0C0DA000" />
+        <register type="NOA" address="0x00009888" value="0x0E0DA000" />
+        <register type="NOA" address="0x00009888" value="0x020D2000" />
+        <register type="NOA" address="0x00009888" value="0x0C0F5400" />
+        <register type="NOA" address="0x00009888" value="0x0E0F5500" />
+        <register type="NOA" address="0x00009888" value="0x100F0155" />
+        <register type="NOA" address="0x00009888" value="0x002C8000" />
+        <register type="NOA" address="0x00009888" value="0x0E2CC000" />
+        <register type="NOA" address="0x00009888" value="0x162CFB00" />
+        <register type="NOA" address="0x00009888" value="0x182C00BE" />
+        <register type="NOA" address="0x00009888" value="0x022CC000" />
+        <register type="NOA" address="0x00009888" value="0x042CC000" />
+        <register type="NOA" address="0x00009888" value="0x19900157" />
+        <register type="NOA" address="0x00009888" value="0x1B900158" />
+        <register type="NOA" address="0x00009888" value="0x1D900105" />
+        <register type="NOA" address="0x00009888" value="0x1F900103" />
+        <register type="NOA" address="0x00009888" value="0x35900000" />
+        <register type="NOA" address="0x00009888" value="0x11900FFF" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x41900800" />
+        <register type="NOA" address="0x00009888" value="0x55900000" />
+        <register type="NOA" address="0x00009888" value="0x45900863" />
+        <register type="NOA" address="0x00009888" value="0x47900802" />
+        <register type="NOA" address="0x00009888" value="0x57900000" />
+        <register type="NOA" address="0x00009888" value="0x49900802" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+        <register type="NOA" address="0x00009888" value="0x4B900002" />
+        <register type="NOA" address="0x00009888" value="0x59900000" />
+        <register type="NOA" address="0x00009888" value="0x43900C62" />
+        <register type="NOA" address="0x00009888" value="0x53903333" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x00800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+        <register type="OA" address="0x00002740" value="0x00000000" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00000003" />
+        <register type="FLEX" address="0x0000E658" value="0x00002001" />
+        <register type="FLEX" address="0x0000E758" value="0x00778008" />
+        <register type="FLEX" address="0x0000E45C" value="0x00088078" />
+        <register type="FLEX" address="0x0000E55C" value="0x00808708" />
+        <register type="FLEX" address="0x0000E65C" value="0x00A08908" />
+    </register_config>
+  </set>
+
+  <set name="Render Metrics for 3D Pipeline Profile Gen9"
+       mdapi_supported_apis="VK OGL OCL IO BB"
+       underscore_name="render_pipe_profile"
+       hw_config_guid="bd2d9cae-b9ec-4f5b-9d2f-934bed398a2d"
+       chipset="SKLGT3"
+       symbol_name="RenderPipeProfile"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Bottleneck"
+             low_watermark="10"
+             description="The percentage of time in which vertex shader pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="30"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_bottleneck"
+             units="percent"
+             symbol_name="VsBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Hi-Depth Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which early hierarchical depth test pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="15"
+             equation="C 6 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="hi_depth_bottleneck"
+             units="percent"
+             symbol_name="HiDepthBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which geometry shader pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="15"
+             equation="B 3 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gs_bottleneck"
+             units="percent"
+             symbol_name="GsBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Geometry Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="BC Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which barycentric coordinates calculation pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="15"
+             equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="bc_bottleneck"
+             units="percent"
+             symbol_name="BcBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Rasterizer/Barycentric Calc"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="HS Stall"
+             description="The percentage of time in which hull shader pipeline stage was stalled."
+             data_type="float"
+             equation="C 1 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="hs_stall"
+             units="percent"
+             symbol_name="HsStall"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier4 Correlate Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Hull Shader"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texel lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="VF Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which vertex fetch pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="15"
+             equation="C 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vf_bottleneck"
+             units="percent"
+             symbol_name="VfBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Input Assembler"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Strip-Fans Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which strip-fans pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="10"
+             equation="B 6 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sf_bottleneck"
+             units="percent"
+             symbol_name="SfBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Rasterizer/Strip-Fans"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SF Stall"
+             description="The percentage of time in which strip-fans pipeline stage was stalled."
+             data_type="float"
+             equation="C 5 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sf_stall"
+             units="percent"
+             symbol_name="SfStall"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Correlate Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Strip-Fans"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="HS Bottleneck"
+             low_watermark="3"
+             description="The percentage of time in which hull shader pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="9"
+             equation="B 1 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="hs_bottleneck"
+             units="percent"
+             symbol_name="HsBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Hull Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="CL Stall"
+             description="The percentage of time in which clipper pipeline stage was stalled."
+             data_type="float"
+             equation="C 4 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="cl_stall"
+             units="percent"
+             symbol_name="ClStall"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Correlate Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Clipper"
+             />
+    <counter name="SO Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which stream output pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="15"
+             equation="B 4 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="so_bottleneck"
+             units="percent"
+             symbol_name="SoBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Stream Output"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="DS Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which domain shader pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="15"
+             equation="B 2 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ds_bottleneck"
+             units="percent"
+             symbol_name="DsBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Domain Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Clipper Bottleneck"
+             low_watermark="10"
+             description="The percentage of time in which clipper pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="30"
+             equation="B 5 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="cl_bottleneck"
+             units="percent"
+             symbol_name="ClBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Clipper"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Stall"
+             description="The percentage of time in which domain shader pipeline stage was stalled."
+             data_type="float"
+             equation="C 2 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ds_stall"
+             units="percent"
+             symbol_name="DsStall"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier4 Correlate Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Domain Shader"
+             />
+    <counter name="Early Depth Bottleneck"
+             low_watermark="10"
+             description="The percentage of time in which early depth test pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="30"
+             equation="B 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="early_depth_bottleneck"
+             units="percent"
+             symbol_name="EarlyDepthBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="SO Stall"
+             description="The percentage of time in which stream-output pipeline stage was stalled."
+             data_type="float"
+             equation="C 3 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="so_stall"
+             units="percent"
+             symbol_name="SoStall"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Correlate Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Stream Output"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x0C0E001F" />
+        <register type="NOA" address="0x00009888" value="0x0A0F0000" />
+        <register type="NOA" address="0x00009888" value="0x10116800" />
+        <register type="NOA" address="0x00009888" value="0x178A03E0" />
+        <register type="NOA" address="0x00009888" value="0x11824C00" />
+        <register type="NOA" address="0x00009888" value="0x11830020" />
+        <register type="NOA" address="0x00009888" value="0x13840020" />
+        <register type="NOA" address="0x00009888" value="0x11850019" />
+        <register type="NOA" address="0x00009888" value="0x11860007" />
+        <register type="NOA" address="0x00009888" value="0x01870C40" />
+        <register type="NOA" address="0x00009888" value="0x17880000" />
+        <register type="NOA" address="0x00009888" value="0x022F4000" />
+        <register type="NOA" address="0x00009888" value="0x0A4C0040" />
+        <register type="NOA" address="0x00009888" value="0x0C0D8000" />
+        <register type="NOA" address="0x00009888" value="0x040D4000" />
+        <register type="NOA" address="0x00009888" value="0x060D2000" />
+        <register type="NOA" address="0x00009888" value="0x020E5400" />
+        <register type="NOA" address="0x00009888" value="0x000E0000" />
+        <register type="NOA" address="0x00009888" value="0x080F0040" />
+        <register type="NOA" address="0x00009888" value="0x000F0000" />
+        <register type="NOA" address="0x00009888" value="0x100F0000" />
+        <register type="NOA" address="0x00009888" value="0x0E0F0040" />
+        <register type="NOA" address="0x00009888" value="0x0C2C8000" />
+        <register type="NOA" address="0x00009888" value="0x06104000" />
+        <register type="NOA" address="0x00009888" value="0x06110012" />
+        <register type="NOA" address="0x00009888" value="0x06131000" />
+        <register type="NOA" address="0x00009888" value="0x01898000" />
+        <register type="NOA" address="0x00009888" value="0x0D890100" />
+        <register type="NOA" address="0x00009888" value="0x03898000" />
+        <register type="NOA" address="0x00009888" value="0x09808000" />
+        <register type="NOA" address="0x00009888" value="0x0B808000" />
+        <register type="NOA" address="0x00009888" value="0x0380C000" />
+        <register type="NOA" address="0x00009888" value="0x0F8A0075" />
+        <register type="NOA" address="0x00009888" value="0x1D8A0000" />
+        <register type="NOA" address="0x00009888" value="0x118A8000" />
+        <register type="NOA" address="0x00009888" value="0x1B8A4000" />
+        <register type="NOA" address="0x00009888" value="0x138A8000" />
+        <register type="NOA" address="0x00009888" value="0x1D81A000" />
+        <register type="NOA" address="0x00009888" value="0x15818000" />
+        <register type="NOA" address="0x00009888" value="0x17818000" />
+        <register type="NOA" address="0x00009888" value="0x0B820030" />
+        <register type="NOA" address="0x00009888" value="0x07828000" />
+        <register type="NOA" address="0x00009888" value="0x0D824000" />
+        <register type="NOA" address="0x00009888" value="0x0F828000" />
+        <register type="NOA" address="0x00009888" value="0x05824000" />
+        <register type="NOA" address="0x00009888" value="0x0D830003" />
+        <register type="NOA" address="0x00009888" value="0x0583000C" />
+        <register type="NOA" address="0x00009888" value="0x09830000" />
+        <register type="NOA" address="0x00009888" value="0x03838000" />
+        <register type="NOA" address="0x00009888" value="0x07838000" />
+        <register type="NOA" address="0x00009888" value="0x0B840980" />
+        <register type="NOA" address="0x00009888" value="0x03844D80" />
+        <register type="NOA" address="0x00009888" value="0x11840000" />
+        <register type="NOA" address="0x00009888" value="0x09848000" />
+        <register type="NOA" address="0x00009888" value="0x09850080" />
+        <register type="NOA" address="0x00009888" value="0x03850003" />
+        <register type="NOA" address="0x00009888" value="0x01850000" />
+        <register type="NOA" address="0x00009888" value="0x07860000" />
+        <register type="NOA" address="0x00009888" value="0x0F860400" />
+        <register type="NOA" address="0x00009888" value="0x09870032" />
+        <register type="NOA" address="0x00009888" value="0x01888052" />
+        <register type="NOA" address="0x00009888" value="0x11880000" />
+        <register type="NOA" address="0x00009888" value="0x09884000" />
+        <register type="NOA" address="0x00009888" value="0x1B931001" />
+        <register type="NOA" address="0x00009888" value="0x1D930001" />
+        <register type="NOA" address="0x00009888" value="0x19934000" />
+        <register type="NOA" address="0x00009888" value="0x1B958000" />
+        <register type="NOA" address="0x00009888" value="0x1D950094" />
+        <register type="NOA" address="0x00009888" value="0x19958000" />
+        <register type="NOA" address="0x00009888" value="0x09E58000" />
+        <register type="NOA" address="0x00009888" value="0x0BE58000" />
+        <register type="NOA" address="0x00009888" value="0x03E5C000" />
+        <register type="NOA" address="0x00009888" value="0x0592C000" />
+        <register type="NOA" address="0x00009888" value="0x0B928000" />
+        <register type="NOA" address="0x00009888" value="0x0D924000" />
+        <register type="NOA" address="0x00009888" value="0x0F924000" />
+        <register type="NOA" address="0x00009888" value="0x11928000" />
+        <register type="NOA" address="0x00009888" value="0x1392C000" />
+        <register type="NOA" address="0x00009888" value="0x09924000" />
+        <register type="NOA" address="0x00009888" value="0x01985000" />
+        <register type="NOA" address="0x00009888" value="0x07988000" />
+        <register type="NOA" address="0x00009888" value="0x09981000" />
+        <register type="NOA" address="0x00009888" value="0x0B982000" />
+        <register type="NOA" address="0x00009888" value="0x0D982000" />
+        <register type="NOA" address="0x00009888" value="0x0F989000" />
+        <register type="NOA" address="0x00009888" value="0x05982000" />
+        <register type="NOA" address="0x00009888" value="0x13904000" />
+        <register type="NOA" address="0x00009888" value="0x21904000" />
+        <register type="NOA" address="0x00009888" value="0x23904000" />
+        <register type="NOA" address="0x00009888" value="0x25908000" />
+        <register type="NOA" address="0x00009888" value="0x27904000" />
+        <register type="NOA" address="0x00009888" value="0x29908000" />
+        <register type="NOA" address="0x00009888" value="0x2B904000" />
+        <register type="NOA" address="0x00009888" value="0x2F904000" />
+        <register type="NOA" address="0x00009888" value="0x31904000" />
+        <register type="NOA" address="0x00009888" value="0x15904000" />
+        <register type="NOA" address="0x00009888" value="0x17908000" />
+        <register type="NOA" address="0x00009888" value="0x19908000" />
+        <register type="NOA" address="0x00009888" value="0x1B904000" />
+        <register type="NOA" address="0x00009888" value="0x1190C080" />
+        <register type="NOA" address="0x00009888" value="0x51901150" />
+        <register type="NOA" address="0x00009888" value="0x41901400" />
+        <register type="NOA" address="0x00009888" value="0x55905111" />
+        <register type="NOA" address="0x00009888" value="0x45901400" />
+        <register type="NOA" address="0x00009888" value="0x479004A5" />
+        <register type="NOA" address="0x00009888" value="0x57903455" />
+        <register type="NOA" address="0x00009888" value="0x49900000" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+        <register type="NOA" address="0x00009888" value="0x4B9000A0" />
+        <register type="NOA" address="0x00009888" value="0x59900001" />
+        <register type="NOA" address="0x00009888" value="0x43900005" />
+        <register type="NOA" address="0x00009888" value="0x53900455" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002724" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002770" value="0x0007FFEA" />
+        <register type="OA" address="0x00002774" value="0x00007FFC" />
+        <register type="OA" address="0x00002778" value="0x0007AFFA" />
+        <register type="OA" address="0x0000277C" value="0x0000F5FD" />
+        <register type="OA" address="0x00002780" value="0x00079FFA" />
+        <register type="OA" address="0x00002784" value="0x0000F3FB" />
+        <register type="OA" address="0x00002788" value="0x0007BF7A" />
+        <register type="OA" address="0x0000278C" value="0x0000F7E7" />
+        <register type="OA" address="0x00002790" value="0x0007FEFA" />
+        <register type="OA" address="0x00002794" value="0x0000F7CF" />
+        <register type="OA" address="0x00002798" value="0x00077FFA" />
+        <register type="OA" address="0x0000279C" value="0x0000EFDF" />
+        <register type="OA" address="0x000027A0" value="0x0006FFFA" />
+        <register type="OA" address="0x000027A4" value="0x0000CFBF" />
+        <register type="OA" address="0x000027A8" value="0x0003FFFA" />
+        <register type="OA" address="0x000027AC" value="0x00005F7F" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00015014" />
+        <register type="FLEX" address="0x0000E658" value="0x00025024" />
+        <register type="FLEX" address="0x0000E758" value="0x00035034" />
+        <register type="FLEX" address="0x0000E45C" value="0x00045044" />
+        <register type="FLEX" address="0x0000E55C" value="0x00055054" />
+        <register type="FLEX" address="0x0000E65C" value="0x00065064" />
+    </register_config>
+  </set>
+
+  <set name="Memory Reads Distribution Gen9"
+       mdapi_supported_apis="VK OGL OCL IO BB"
+       underscore_name="memory_reads"
+       hw_config_guid="4ca0f3fe-7fd3-4924-98cb-1807d9879767"
+       chipset="SKLGT3"
+       symbol_name="MemoryReads"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GtiL3Bank0Reads"
+             description="The total number of GTI memory reads from L3 Bank 0 (L3 Cache misses)."
+             data_type="uint64"
+             equation="C 4 READ"
+             underscore_name="gti_l3_bank0_reads"
+             units="messages"
+             symbol_name="GtiL3Bank0Reads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/L3"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="GtiRingAccesses"
+             description="The total number of all accesses from GTI to the ring."
+             data_type="uint64"
+             equation="C 3 READ 2 UMUL"
+             underscore_name="gti_ring_accesses"
+             units="messages"
+             symbol_name="GtiRingAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="GtiL3Bank3Reads"
+             description="The total number of GTI memory reads from L3 Bank 3 (L3 Cache misses)."
+             data_type="uint64"
+             equation="C 7 READ"
+             underscore_name="gti_l3_bank3_reads"
+             units="messages"
+             symbol_name="GtiL3Bank3Reads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="GTI/L3"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="GtiRsMemoryReads"
+             description="The total number of GTI memory reads from Resource Streamer."
+             data_type="uint64"
+             equation="B 2 READ"
+             underscore_name="gti_rs_memory_reads"
+             units="messages"
+             symbol_name="GtiRsMemoryReads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/3D Pipe/Resource Streamer"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GtiHizMemoryReads"
+             description="The total number of GTI memory reads from Hierarchical Depth Cache (Hi-Depth Cache misses)."
+             data_type="uint64"
+             equation="B 5 READ"
+             underscore_name="gti_hiz_memory_reads"
+             units="messages"
+             symbol_name="GtiHizMemoryReads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Depth Cache"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="GtiRccMemoryReads"
+             description="The total number of GTI memory reads from Render Color Cache (Render Color Cache misses)."
+             data_type="uint64"
+             equation="B 3 READ"
+             underscore_name="gti_rcc_memory_reads"
+             units="messages"
+             symbol_name="GtiRccMemoryReads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Color Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GtiL3Bank1Reads"
+             description="The total number of GTI memory reads from L3 Bank 1 (L3 Cache misses)."
+             data_type="uint64"
+             equation="C 5 READ"
+             underscore_name="gti_l3_bank1_reads"
+             units="messages"
+             symbol_name="GtiL3Bank1Reads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="GTI/L3"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GtiCmdStreamerMemoryReads"
+             description="The total number of GTI memory reads from Command Streamer."
+             data_type="uint64"
+             equation="B 0 READ"
+             underscore_name="gti_cmd_streamer_memory_reads"
+             units="messages"
+             symbol_name="GtiCmdStreamerMemoryReads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/3D Pipe/Command Streamer"
+             />
+    <counter name="GtiL3Bank2Reads"
+             description="The total number of GTI memory reads from L3 Bank 2 (L3 Cache misses)."
+             data_type="uint64"
+             equation="C 6 READ"
+             underscore_name="gti_l3_bank2_reads"
+             units="messages"
+             symbol_name="GtiL3Bank2Reads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="GTI/L3"
+             />
+    <counter name="GtiMemoryReads"
+             description="The total number of GTI memory reads."
+             data_type="uint64"
+             equation="C 0 READ"
+             underscore_name="gti_memory_reads"
+             units="messages"
+             symbol_name="GtiMemoryReads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="GtiRczMemoryReads"
+             description="The total number of GTI memory reads from Render Depth Cache (Render Depth Cache misses)."
+             data_type="uint64"
+             equation="B 7 READ"
+             underscore_name="gti_rcz_memory_reads"
+             units="messages"
+             symbol_name="GtiRczMemoryReads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Depth Cache"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="GtiMscMemoryReads"
+             description="The total number of GTI memory reads from Multisampling Color Cache (Multisampling Color Cache misses)."
+             data_type="uint64"
+             equation="B 4 READ"
+             underscore_name="gti_msc_memory_reads"
+             units="messages"
+             symbol_name="GtiMscMemoryReads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Color Cache"
+             />
+    <counter name="GtiVfMemoryReads"
+             description="The total number of GTI memory reads from Vertex Fetch."
+             data_type="uint64"
+             equation="B 1 READ"
+             underscore_name="gti_vf_memory_reads"
+             units="messages"
+             symbol_name="GtiVfMemoryReads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/3D Pipe/Vertex Fetch"
+             />
+    <counter name="GtiStcMemoryReads"
+             description="The total number of GTI memory reads from Stencil Cache (Stencil Cache misses)."
+             data_type="uint64"
+             equation="B 6 READ"
+             underscore_name="gti_stc_memory_reads"
+             units="messages"
+             symbol_name="GtiStcMemoryReads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Depth Cache"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GtiL3Reads"
+             description="The total number of GTI memory reads from L3 (L3 Cache misses)."
+             data_type="uint64"
+             equation="$GtiL3Bank0Reads $GtiL3Bank1Reads $GtiL3Bank2Reads $GtiL3Bank3Reads UADD UADD UADD"
+             underscore_name="gti_l3_reads"
+             units="messages"
+             symbol_name="GtiL3Reads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/L3"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x11810C00" />
+        <register type="NOA" address="0x00009888" value="0x1381001A" />
+        <register type="NOA" address="0x00009888" value="0x37906800" />
+        <register type="NOA" address="0x00009888" value="0x3F900064" />
+        <register type="NOA" address="0x00009888" value="0x03811300" />
+        <register type="NOA" address="0x00009888" value="0x05811B12" />
+        <register type="NOA" address="0x00009888" value="0x0781001A" />
+        <register type="NOA" address="0x00009888" value="0x1F810000" />
+        <register type="NOA" address="0x00009888" value="0x17810000" />
+        <register type="NOA" address="0x00009888" value="0x19810000" />
+        <register type="NOA" address="0x00009888" value="0x1B810000" />
+        <register type="NOA" address="0x00009888" value="0x1D810000" />
+        <register type="NOA" address="0x00009888" value="0x1B930055" />
+        <register type="NOA" address="0x00009888" value="0x03E58000" />
+        <register type="NOA" address="0x00009888" value="0x05E5C000" />
+        <register type="NOA" address="0x00009888" value="0x07E54000" />
+        <register type="NOA" address="0x00009888" value="0x13900150" />
+        <register type="NOA" address="0x00009888" value="0x21900151" />
+        <register type="NOA" address="0x00009888" value="0x23900152" />
+        <register type="NOA" address="0x00009888" value="0x25900153" />
+        <register type="NOA" address="0x00009888" value="0x27900154" />
+        <register type="NOA" address="0x00009888" value="0x29900155" />
+        <register type="NOA" address="0x00009888" value="0x2B900156" />
+        <register type="NOA" address="0x00009888" value="0x2D900157" />
+        <register type="NOA" address="0x00009888" value="0x2F90015F" />
+        <register type="NOA" address="0x00009888" value="0x31900105" />
+        <register type="NOA" address="0x00009888" value="0x15900103" />
+        <register type="NOA" address="0x00009888" value="0x17900101" />
+        <register type="NOA" address="0x00009888" value="0x35900000" />
+        <register type="NOA" address="0x00009888" value="0x19908000" />
+        <register type="NOA" address="0x00009888" value="0x1B908000" />
+        <register type="NOA" address="0x00009888" value="0x1D908000" />
+        <register type="NOA" address="0x00009888" value="0x1F908000" />
+        <register type="NOA" address="0x00009888" value="0x11900000" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x41900C60" />
+        <register type="NOA" address="0x00009888" value="0x55900000" />
+        <register type="NOA" address="0x00009888" value="0x45900C00" />
+        <register type="NOA" address="0x00009888" value="0x47900C63" />
+        <register type="NOA" address="0x00009888" value="0x57900000" />
+        <register type="NOA" address="0x00009888" value="0x49900C63" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+        <register type="NOA" address="0x00009888" value="0x4B900063" />
+        <register type="NOA" address="0x00009888" value="0x59900000" />
+        <register type="NOA" address="0x00009888" value="0x43900003" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x0000272C" value="0xFFFFFFFF" />
+        <register type="OA" address="0x00002728" value="0xFFFFFFFF" />
+        <register type="OA" address="0x00002724" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x0000271C" value="0xFFFFFFFF" />
+        <register type="OA" address="0x00002718" value="0xFFFFFFFF" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x0000274C" value="0x86543210" />
+        <register type="OA" address="0x00002748" value="0x86543210" />
+        <register type="OA" address="0x00002744" value="0x00006667" />
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x0000275C" value="0x86543210" />
+        <register type="OA" address="0x00002758" value="0x86543210" />
+        <register type="OA" address="0x00002754" value="0x00006465" />
+        <register type="OA" address="0x00002750" value="0x00000000" />
+        <register type="OA" address="0x00002770" value="0x0007F81A" />
+        <register type="OA" address="0x00002774" value="0x0000FE00" />
+        <register type="OA" address="0x00002778" value="0x0007F82A" />
+        <register type="OA" address="0x0000277C" value="0x0000FE00" />
+        <register type="OA" address="0x00002780" value="0x0007F872" />
+        <register type="OA" address="0x00002784" value="0x0000FE00" />
+        <register type="OA" address="0x00002788" value="0x0007F8BA" />
+        <register type="OA" address="0x0000278C" value="0x0000FE00" />
+        <register type="OA" address="0x00002790" value="0x0007F87A" />
+        <register type="OA" address="0x00002794" value="0x0000FE00" />
+        <register type="OA" address="0x00002798" value="0x0007F8EA" />
+        <register type="OA" address="0x0000279C" value="0x0000FE00" />
+        <register type="OA" address="0x000027A0" value="0x0007F8E2" />
+        <register type="OA" address="0x000027A4" value="0x0000FE00" />
+        <register type="OA" address="0x000027A8" value="0x0007F8F2" />
+        <register type="OA" address="0x000027AC" value="0x0000FE00" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00015014" />
+        <register type="FLEX" address="0x0000E658" value="0x00025024" />
+        <register type="FLEX" address="0x0000E758" value="0x00035034" />
+        <register type="FLEX" address="0x0000E45C" value="0x00045044" />
+        <register type="FLEX" address="0x0000E55C" value="0x00055054" />
+        <register type="FLEX" address="0x0000E65C" value="0x00065064" />
+    </register_config>
+  </set>
+
+  <set name="Memory Writes Distribution Gen9"
+       mdapi_supported_apis="VK OGL OCL IO BB"
+       underscore_name="memory_writes"
+       hw_config_guid="a0c0172c-ee13-403d-99ff-2bdf6936cf14"
+       chipset="SKLGT3"
+       symbol_name="MemoryWrites"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GtiMemoryWrites"
+             description="The total number of GTI memory writes."
+             data_type="uint64"
+             equation="C 0 READ"
+             underscore_name="gti_memory_writes"
+             units="messages"
+             symbol_name="GtiMemoryWrites"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="GtiRingAccesses"
+             description="The total number of all GTI accesses to the ring."
+             data_type="uint64"
+             equation="C 3 READ 2 UMUL"
+             underscore_name="gti_ring_accesses"
+             units="messages"
+             symbol_name="GtiRingAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="GtiMscMemoryWrites"
+             description="The total number of GTI memory writes from Multisampling Color Cache (Multisampling Color Cache invalidations)."
+             data_type="uint64"
+             equation="B 4 READ"
+             underscore_name="gti_msc_memory_writes"
+             units="messages"
+             symbol_name="GtiMscMemoryWrites"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Color Cache"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="GtiCmdStreamerMemoryWrites"
+             description="The total number of GTI memory writes from Command Streamer."
+             data_type="uint64"
+             equation="B 0 READ"
+             underscore_name="gti_cmd_streamer_memory_writes"
+             units="messages"
+             symbol_name="GtiCmdStreamerMemoryWrites"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/3D Pipe/Command Streamer"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GtiL3Bank0Writes"
+             description="The total number of GTI memory writes from L3 Bank 0 (L3 Bank 0 invalidations)."
+             data_type="uint64"
+             equation="C 4 READ"
+             underscore_name="gti_l3_bank0_writes"
+             units="messages"
+             symbol_name="GtiL3Bank0Writes"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/L3"
+             />
+    <counter name="GtiL3Bank1Writes"
+             description="The total number of GTI memory writes from L3 Bank 1 (L3 Bank 1 invalidations)."
+             data_type="uint64"
+             equation="C 5 READ"
+             underscore_name="gti_l3_bank1_writes"
+             units="messages"
+             symbol_name="GtiL3Bank1Writes"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/L3"
+             />
+    <counter name="GtiL3Bank2Writes"
+             description="The total number of GTI memory writes from L3 Bank 2 (L3 Bank 2 invalidations)."
+             data_type="uint64"
+             equation="C 6 READ"
+             underscore_name="gti_l3_bank2_writes"
+             units="messages"
+             symbol_name="GtiL3Bank2Writes"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/L3"
+             />
+    <counter name="GtiL3Bank3Writes"
+             description="The total number of GTI memory writes from L3 Bank 3 (L3 Bank 3 invalidations)."
+             data_type="uint64"
+             equation="C 7 READ"
+             underscore_name="gti_l3_bank3_writes"
+             units="messages"
+             symbol_name="GtiL3Bank3Writes"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/L3"
+             />
+    <counter name="GtiL3Writes"
+             description="The total number of GTI memory writes from L3 (L3 invalidations)."
+             data_type="uint64"
+             equation="$GtiL3Bank0Writes $GtiL3Bank1Writes $GtiL3Bank2Writes $GtiL3Bank3Writes UADD UADD UADD"
+             underscore_name="gti_l3_writes"
+             units="messages"
+             symbol_name="GtiL3Writes"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/L3"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GtiRccMemoryWrites"
+             description="The total number of GTI memory writes from Render Color Cache (Render Color Cache invalidations)."
+             data_type="uint64"
+             equation="B 3 READ"
+             underscore_name="gti_rcc_memory_writes"
+             units="messages"
+             symbol_name="GtiRccMemoryWrites"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Color Cache"
+             />
+    <counter name="GtiSoMemoryWrites"
+             description="The total number of GTI memory writes from Stream Output."
+             data_type="uint64"
+             equation="B 2 READ"
+             underscore_name="gti_so_memory_writes"
+             units="messages"
+             symbol_name="GtiSoMemoryWrites"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/3D Pipe/Stream Output"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GtiStcMemoryWrites"
+             description="The total number of GTI memory writes from Stencil Cache."
+             data_type="uint64"
+             equation="B 6 READ"
+             underscore_name="gti_stc_memory_writes"
+             units="messages"
+             symbol_name="GtiStcMemoryWrites"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Depth Cache"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="GtiRczMemoryWrites"
+             description="The total number of GTI memory writes from Render Depth Cache."
+             data_type="uint64"
+             equation="B 7 READ"
+             underscore_name="gti_rcz_memory_writes"
+             units="messages"
+             symbol_name="GtiRczMemoryWrites"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Depth Cache"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="GtiHizMemoryWrites"
+             description="The total number of GTI memory writes from Hierarchical Depth Cache."
+             data_type="uint64"
+             equation="B 5 READ"
+             underscore_name="gti_hiz_memory_writes"
+             units="messages"
+             symbol_name="GtiHizMemoryWrites"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Depth Cache"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x11810C00" />
+        <register type="NOA" address="0x00009888" value="0x1381001A" />
+        <register type="NOA" address="0x00009888" value="0x37906800" />
+        <register type="NOA" address="0x00009888" value="0x3F901000" />
+        <register type="NOA" address="0x00009888" value="0x03811300" />
+        <register type="NOA" address="0x00009888" value="0x05811B12" />
+        <register type="NOA" address="0x00009888" value="0x0781001A" />
+        <register type="NOA" address="0x00009888" value="0x1F810000" />
+        <register type="NOA" address="0x00009888" value="0x17810000" />
+        <register type="NOA" address="0x00009888" value="0x19810000" />
+        <register type="NOA" address="0x00009888" value="0x1B810000" />
+        <register type="NOA" address="0x00009888" value="0x1D810000" />
+        <register type="NOA" address="0x00009888" value="0x1B930055" />
+        <register type="NOA" address="0x00009888" value="0x03E58000" />
+        <register type="NOA" address="0x00009888" value="0x05E5C000" />
+        <register type="NOA" address="0x00009888" value="0x07E54000" />
+        <register type="NOA" address="0x00009888" value="0x13900160" />
+        <register type="NOA" address="0x00009888" value="0x21900161" />
+        <register type="NOA" address="0x00009888" value="0x23900162" />
+        <register type="NOA" address="0x00009888" value="0x25900163" />
+        <register type="NOA" address="0x00009888" value="0x27900164" />
+        <register type="NOA" address="0x00009888" value="0x29900165" />
+        <register type="NOA" address="0x00009888" value="0x2B900166" />
+        <register type="NOA" address="0x00009888" value="0x2D900167" />
+        <register type="NOA" address="0x00009888" value="0x2F900150" />
+        <register type="NOA" address="0x00009888" value="0x31900105" />
+        <register type="NOA" address="0x00009888" value="0x15900103" />
+        <register type="NOA" address="0x00009888" value="0x17900101" />
+        <register type="NOA" address="0x00009888" value="0x35900000" />
+        <register type="NOA" address="0x00009888" value="0x19908000" />
+        <register type="NOA" address="0x00009888" value="0x1B908000" />
+        <register type="NOA" address="0x00009888" value="0x1D908000" />
+        <register type="NOA" address="0x00009888" value="0x1F908000" />
+        <register type="NOA" address="0x00009888" value="0x11900000" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x41900C60" />
+        <register type="NOA" address="0x00009888" value="0x55900000" />
+        <register type="NOA" address="0x00009888" value="0x45900C00" />
+        <register type="NOA" address="0x00009888" value="0x47900C63" />
+        <register type="NOA" address="0x00009888" value="0x57900000" />
+        <register type="NOA" address="0x00009888" value="0x49900C63" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+        <register type="NOA" address="0x00009888" value="0x4B900063" />
+        <register type="NOA" address="0x00009888" value="0x59900000" />
+        <register type="NOA" address="0x00009888" value="0x43900003" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x0000272C" value="0xFFFFFFFF" />
+        <register type="OA" address="0x00002728" value="0xFFFFFFFF" />
+        <register type="OA" address="0x00002724" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x0000271C" value="0xFFFFFFFF" />
+        <register type="OA" address="0x00002718" value="0xFFFFFFFF" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x0000274C" value="0x86543210" />
+        <register type="OA" address="0x00002748" value="0x86543210" />
+        <register type="OA" address="0x00002744" value="0x00006667" />
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x0000275C" value="0x86543210" />
+        <register type="OA" address="0x00002758" value="0x86543210" />
+        <register type="OA" address="0x00002754" value="0x00006465" />
+        <register type="OA" address="0x00002750" value="0x00000000" />
+        <register type="OA" address="0x00002770" value="0x0007F81A" />
+        <register type="OA" address="0x00002774" value="0x0000FE00" />
+        <register type="OA" address="0x00002778" value="0x0007F82A" />
+        <register type="OA" address="0x0000277C" value="0x0000FE00" />
+        <register type="OA" address="0x00002780" value="0x0007F822" />
+        <register type="OA" address="0x00002784" value="0x0000FE00" />
+        <register type="OA" address="0x00002788" value="0x0007F8BA" />
+        <register type="OA" address="0x0000278C" value="0x0000FE00" />
+        <register type="OA" address="0x00002790" value="0x0007F87A" />
+        <register type="OA" address="0x00002794" value="0x0000FE00" />
+        <register type="OA" address="0x00002798" value="0x0007F8EA" />
+        <register type="OA" address="0x0000279C" value="0x0000FE00" />
+        <register type="OA" address="0x000027A0" value="0x0007F8E2" />
+        <register type="OA" address="0x000027A4" value="0x0000FE00" />
+        <register type="OA" address="0x000027A8" value="0x0007F8F2" />
+        <register type="OA" address="0x000027AC" value="0x0000FE00" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00015014" />
+        <register type="FLEX" address="0x0000E658" value="0x00025024" />
+        <register type="FLEX" address="0x0000E758" value="0x00035034" />
+        <register type="FLEX" address="0x0000E45C" value="0x00045044" />
+        <register type="FLEX" address="0x0000E55C" value="0x00055054" />
+        <register type="FLEX" address="0x0000E65C" value="0x00065064" />
+    </register_config>
+  </set>
+
+  <set name="Compute Metrics Extended Gen9"
+       mdapi_supported_apis="VK OGL4 OCL IO BB"
+       underscore_name="compute_extended"
+       hw_config_guid="52435e0b-f188-42ea-8680-21a56ee20dee"
+       chipset="SKLGT3"
+       symbol_name="ComputeExtended"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="fpu0_active"
+             units="percent"
+             symbol_name="Fpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="fpu1_active"
+             units="percent"
+             symbol_name="Fpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU AVG IPC Rate"
+             description="The average rate of IPC calculated for 2 FPU pipelines."
+             data_type="float"
+             max_equation="2"
+             equation="A 9 READ  A 10 READ  A 11 READ UADD  A 9 READ USUB FDIV 1 FADD"
+             underscore_name="eu_avg_ipc_rate"
+             units="number"
+             symbol_name="EuAvgIpcRate"
+             semantic_type="ratio"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Typed Writes 0"
+             description="The subslice 0 typed writes."
+             data_type="uint64"
+             equation="C 0 READ"
+             underscore_name="typed_writes0"
+             units="messages"
+             symbol_name="TypedWrites0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="EuTypedAtomics0"
+             description="The subslice 0 EU Typed Atomics subslice 0."
+             data_type="uint64"
+             equation="B 5 READ"
+             underscore_name="eu_typed_atomics0"
+             units="messages"
+             symbol_name="EuTypedAtomics0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="Typed Atomics 0"
+             description="The subslice 0 typed atomics."
+             data_type="uint64"
+             equation="C 4 READ"
+             underscore_name="typed_atomics0"
+             units="messages"
+             symbol_name="TypedAtomics0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="TypedAtomicsPerCacheLine"
+             description="The ratio of EU typed atomics requests to L3 cache line writes."
+             data_type="float"
+             equation="$EuTypedAtomics0 $TypedAtomics0 FDIV"
+             underscore_name="typed_atomics_per_cache_line"
+             units="eu sends to l3 cache lines"
+             symbol_name="TypedAtomicsPerCacheLine"
+             semantic_type="ratio"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="EuUntypedReads0"
+             description="The subslice 0 EU Untyped Reads subslice 0."
+             data_type="uint64"
+             equation="B 0 READ"
+             underscore_name="eu_untyped_reads0"
+             units="messages"
+             symbol_name="EuUntypedReads0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="Untyped Writes 0"
+             description="The subslice 0 untyped writes (including SLM writes)."
+             data_type="uint64"
+             equation="C 1 READ"
+             underscore_name="untyped_writes0"
+             units="messages"
+             symbol_name="UntypedWrites0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="EuUntypedAtomics0"
+             description="The subslice 0 EU Untyped Atomics subslice 0."
+             data_type="uint64"
+             equation="B 4 READ"
+             underscore_name="eu_untyped_atomics0"
+             units="messages"
+             symbol_name="EuUntypedAtomics0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="EuUntypedWrites0"
+             description="The subslice 0 EU Untyped Writes subslice 0."
+             data_type="uint64"
+             equation="B 1 READ"
+             underscore_name="eu_untyped_writes0"
+             units="messages"
+             symbol_name="EuUntypedWrites0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="EuA64UntypedWrites0"
+             description="The subslice 0 EU A64 Untyped Writes subslice 0."
+             data_type="uint64"
+             equation="B 7 READ"
+             underscore_name="eu_a64_untyped_writes0"
+             units="messages"
+             symbol_name="EuA64UntypedWrites0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="UntypedWritesPerCacheLine"
+             description="The ratio of EU untyped write requests to L3 cache line writes."
+             data_type="float"
+             equation="$EuUntypedWrites0 $EuA64UntypedWrites0 UADD $UntypedWrites0 FDIV"
+             underscore_name="untyped_writes_per_cache_line"
+             units="eu sends to l3 cache lines"
+             symbol_name="UntypedWritesPerCacheLine"
+             semantic_type="ratio"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texel lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EuTypedWrites0"
+             description="The subslice 0 EU Typed Writes."
+             data_type="uint64"
+             equation="B 3 READ"
+             underscore_name="eu_typed_writes0"
+             units="messages"
+             symbol_name="EuTypedWrites0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="TypedWritesPerCacheLine"
+             description="The ratio of EU typed write requests to L3 cache line writes."
+             data_type="float"
+             equation="$EuTypedWrites0 $TypedWrites0 FDIV"
+             underscore_name="typed_writes_per_cache_line"
+             units="eu sends to l3 cache lines"
+             symbol_name="TypedWritesPerCacheLine"
+             semantic_type="ratio"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="Typed Reads 0"
+             description="The subslice 0 typed reads."
+             data_type="uint64"
+             equation="C 2 READ"
+             underscore_name="typed_reads0"
+             units="messages"
+             symbol_name="TypedReads0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="Untyped Reads 0"
+             description="The subslice 0 untyped reads (including SLM reads)."
+             data_type="uint64"
+             equation="C 3 READ"
+             underscore_name="untyped_reads0"
+             units="messages"
+             symbol_name="UntypedReads0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="EuA64UntypedReads0"
+             description="The subslice 0 EU A64 Untyped Reads."
+             data_type="uint64"
+             equation="B 6 READ"
+             underscore_name="eu_a64_untyped_reads0"
+             units="messages"
+             symbol_name="EuA64UntypedReads0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="EU Thread Occupancy"
+             description="The percentage of time in which hardware threads occupied EUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 13 READ 8 UMUL $EuCoresTotalCount UDIV $EuThreadsCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_thread_occupancy"
+             units="percent"
+             symbol_name="EuThreadOccupancy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EuTypedReads0"
+             description="The subslice 0 EU Typed Reads."
+             data_type="uint64"
+             equation="B 2 READ"
+             underscore_name="eu_typed_reads0"
+             units="messages"
+             symbol_name="EuTypedReads0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="UntypedReadsPerCacheLine"
+             description="The ratio of EU untyped read requests to L3 cache line reads."
+             data_type="float"
+             equation="$EuUntypedReads0 $EuA64UntypedReads0 UADD $UntypedReads0 FDIV"
+             underscore_name="untyped_reads_per_cache_line"
+             units="eu sends to l3 cache lines"
+             symbol_name="UntypedReadsPerCacheLine"
+             semantic_type="ratio"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="TypedReadsPerCacheLine"
+             description="The ratio of EU typed read requests to L3 cache line reads."
+             data_type="float"
+             equation="$EuTypedReads0 $TypedReads0 FDIV"
+             underscore_name="typed_reads_per_cache_line"
+             units="eu sends to l3 cache lines"
+             symbol_name="TypedReadsPerCacheLine"
+             semantic_type="ratio"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <counter name="EU Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_send_active"
+             units="percent"
+             symbol_name="EuSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x106C00E0" />
+        <register type="NOA" address="0x00009888" value="0x141C8160" />
+        <register type="NOA" address="0x00009888" value="0x161C8015" />
+        <register type="NOA" address="0x00009888" value="0x181C0120" />
+        <register type="NOA" address="0x00009888" value="0x004E8000" />
+        <register type="NOA" address="0x00009888" value="0x0E4E8000" />
+        <register type="NOA" address="0x00009888" value="0x184E8000" />
+        <register type="NOA" address="0x00009888" value="0x1A4EAAA0" />
+        <register type="NOA" address="0x00009888" value="0x1C4E0002" />
+        <register type="NOA" address="0x00009888" value="0x024E8000" />
+        <register type="NOA" address="0x00009888" value="0x044E8000" />
+        <register type="NOA" address="0x00009888" value="0x064E8000" />
+        <register type="NOA" address="0x00009888" value="0x084E8000" />
+        <register type="NOA" address="0x00009888" value="0x0A4E8000" />
+        <register type="NOA" address="0x00009888" value="0x0E6C0B01" />
+        <register type="NOA" address="0x00009888" value="0x006C0200" />
+        <register type="NOA" address="0x00009888" value="0x026C000C" />
+        <register type="NOA" address="0x00009888" value="0x1C6C0000" />
+        <register type="NOA" address="0x00009888" value="0x1E6C0000" />
+        <register type="NOA" address="0x00009888" value="0x1A6C0000" />
+        <register type="NOA" address="0x00009888" value="0x0E1BC000" />
+        <register type="NOA" address="0x00009888" value="0x001B8000" />
+        <register type="NOA" address="0x00009888" value="0x021BC000" />
+        <register type="NOA" address="0x00009888" value="0x001C0041" />
+        <register type="NOA" address="0x00009888" value="0x061C4200" />
+        <register type="NOA" address="0x00009888" value="0x081C4443" />
+        <register type="NOA" address="0x00009888" value="0x0A1C4645" />
+        <register type="NOA" address="0x00009888" value="0x0C1C7647" />
+        <register type="NOA" address="0x00009888" value="0x041C7357" />
+        <register type="NOA" address="0x00009888" value="0x1C1C0030" />
+        <register type="NOA" address="0x00009888" value="0x101C0000" />
+        <register type="NOA" address="0x00009888" value="0x1A1C0000" />
+        <register type="NOA" address="0x00009888" value="0x121C8000" />
+        <register type="NOA" address="0x00009888" value="0x004C8000" />
+        <register type="NOA" address="0x00009888" value="0x0A4CAA2A" />
+        <register type="NOA" address="0x00009888" value="0x0C4C02AA" />
+        <register type="NOA" address="0x00009888" value="0x084CA000" />
+        <register type="NOA" address="0x00009888" value="0x000DA000" />
+        <register type="NOA" address="0x00009888" value="0x060D8000" />
+        <register type="NOA" address="0x00009888" value="0x080DA000" />
+        <register type="NOA" address="0x00009888" value="0x0A0DA000" />
+        <register type="NOA" address="0x00009888" value="0x0C0DA000" />
+        <register type="NOA" address="0x00009888" value="0x0E0DA000" />
+        <register type="NOA" address="0x00009888" value="0x020DA000" />
+        <register type="NOA" address="0x00009888" value="0x040DA000" />
+        <register type="NOA" address="0x00009888" value="0x0C0F5400" />
+        <register type="NOA" address="0x00009888" value="0x0E0F5515" />
+        <register type="NOA" address="0x00009888" value="0x100F0155" />
+        <register type="NOA" address="0x00009888" value="0x002C8000" />
+        <register type="NOA" address="0x00009888" value="0x0E2C8000" />
+        <register type="NOA" address="0x00009888" value="0x162CAA00" />
+        <register type="NOA" address="0x00009888" value="0x182C00AA" />
+        <register type="NOA" address="0x00009888" value="0x022C8000" />
+        <register type="NOA" address="0x00009888" value="0x042C8000" />
+        <register type="NOA" address="0x00009888" value="0x062C8000" />
+        <register type="NOA" address="0x00009888" value="0x082C8000" />
+        <register type="NOA" address="0x00009888" value="0x0A2C8000" />
+        <register type="NOA" address="0x00009888" value="0x11907FFF" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x41900040" />
+        <register type="NOA" address="0x00009888" value="0x55900000" />
+        <register type="NOA" address="0x00009888" value="0x45900802" />
+        <register type="NOA" address="0x00009888" value="0x47900842" />
+        <register type="NOA" address="0x00009888" value="0x57900000" />
+        <register type="NOA" address="0x00009888" value="0x49900842" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+        <register type="NOA" address="0x00009888" value="0x4B900000" />
+        <register type="NOA" address="0x00009888" value="0x59900000" />
+        <register type="NOA" address="0x00009888" value="0x43900800" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002724" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002770" value="0x0007FC2A" />
+        <register type="OA" address="0x00002774" value="0x0000BF00" />
+        <register type="OA" address="0x00002778" value="0x0007FC6A" />
+        <register type="OA" address="0x0000277C" value="0x0000BF00" />
+        <register type="OA" address="0x00002780" value="0x0007FC92" />
+        <register type="OA" address="0x00002784" value="0x0000BF00" />
+        <register type="OA" address="0x00002788" value="0x0007FCA2" />
+        <register type="OA" address="0x0000278C" value="0x0000BF00" />
+        <register type="OA" address="0x00002790" value="0x0007FC32" />
+        <register type="OA" address="0x00002794" value="0x0000BF00" />
+        <register type="OA" address="0x00002798" value="0x0007FC9A" />
+        <register type="OA" address="0x0000279C" value="0x0000BF00" />
+        <register type="OA" address="0x000027A0" value="0x0007FE6A" />
+        <register type="OA" address="0x000027A4" value="0x0000BF00" />
+        <register type="OA" address="0x000027A8" value="0x0007FE7A" />
+        <register type="OA" address="0x000027AC" value="0x0000BF00" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00000003" />
+        <register type="FLEX" address="0x0000E658" value="0x00002001" />
+        <register type="FLEX" address="0x0000E758" value="0x00778008" />
+        <register type="FLEX" address="0x0000E45C" value="0x00088078" />
+        <register type="FLEX" address="0x0000E55C" value="0x00808708" />
+        <register type="FLEX" address="0x0000E65C" value="0x00A08908" />
+    </register_config>
+  </set>
+
+  <set name="Compute Metrics L3 Cache Gen9"
+       mdapi_supported_apis="VK OGL4 OCL IO BB"
+       underscore_name="compute_l3_cache"
+       hw_config_guid="27076eeb-49f3-4fed-8423-c66506005c63"
+       chipset="SKLGT3"
+       symbol_name="ComputeL3Cache"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Bank 03 Accesses"
+             description="The total number of accesses to L3 Bank 03."
+             data_type="uint64"
+             equation="B 3 READ 2 UMUL"
+             underscore_name="l3_bank03_accesses"
+             units="messages"
+             symbol_name="L3Bank03Accesses"
+             availability="$SliceMask 0x01 AND"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="slice"
+             mdapi_group="L3"
+             />
+    <counter name="L3 Accesses"
+             description="The total number of L3 accesses from all entities."
+             data_type="uint64"
+             equation="C 0 READ C 1 READ B 2 READ B 3 READ UADD UADD UADD 2 UMUL"
+             underscore_name="l3_accesses"
+             units="messages"
+             symbol_name="L3Accesses"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Sampler Throughput"
+             description="The total number of GPU memory bytes transferred between samplers and L3 caches."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="A 29 READ 64 UMUL"
+             underscore_name="l3_sampler_throughput"
+             units="bytes"
+             symbol_name="L3SamplerThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Sampler"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="fpu0_active"
+             units="percent"
+             symbol_name="Fpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="fpu1_active"
+             units="percent"
+             symbol_name="Fpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU AVG IPC Rate"
+             description="The average rate of IPC calculated for 2 FPU pipelines."
+             data_type="float"
+             max_equation="2"
+             equation="A 9 READ  A 10 READ  A 11 READ UADD  A 9 READ USUB FDIV 1 FADD"
+             underscore_name="eu_avg_ipc_rate"
+             units="number"
+             symbol_name="EuAvgIpcRate"
+             semantic_type="ratio"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier4 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU0 Binary Instruction"
+             description="The percentage of time in which execution units were actively processing binary instructions on FPU0."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_binary_fpu0_instruction"
+             units="percent"
+             symbol_name="EuBinaryFpu0Instruction"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes/Instructions"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="EU FPU0 Hybrid Instruction"
+             description="The percentage of time in which execution units were actively processing hybrid instructions on FPU0."
+             data_type="float"
+             max_equation="100"
+             equation="A 13 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_hybrid_fpu0_instruction"
+             units="percent"
+             symbol_name="EuHybridFpu0Instruction"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="EU Array/Pipes/Instructions"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Misses"
+             description="The total number of L3 misses."
+             data_type="uint64"
+             equation="C 4 READ C 5 READ UADD"
+             underscore_name="l3_misses"
+             units="messages"
+             symbol_name="L3Misses"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/TAG"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="L3 Bank 00 Accesses"
+             description="The total number of accesses to L3 Bank 00."
+             data_type="uint64"
+             equation="C 0 READ 2 UMUL"
+             underscore_name="l3_bank00_accesses"
+             units="messages"
+             symbol_name="L3Bank00Accesses"
+             availability="$SliceMask 0x01 AND"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="slice"
+             mdapi_group="L3"
+             />
+    <counter name="EU FPU0 Move Instruction"
+             description="The percentage of time in which execution units were actively processing move instructions on FPU0."
+             data_type="float"
+             max_equation="100"
+             equation="A 19 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_move_fpu0_instruction"
+             units="percent"
+             symbol_name="EuMoveFpu0Instruction"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes/Instructions"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU FPU1 Hybrid Instruction"
+             description="The percentage of time in which execution units were actively processing hybrid instructions on FPU1."
+             data_type="float"
+             max_equation="100"
+             equation="A 14 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_hybrid_fpu1_instruction"
+             units="percent"
+             symbol_name="EuHybridFpu1Instruction"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="EU Array/Pipes/Instructions"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texel lookups (with 2x2 accuracy) that missed the L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GTI Read Throughput"
+             description="The total number of GPU memory bytes read from GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL"
+             equation="C 6 READ 64 UMUL"
+             underscore_name="gti_read_throughput"
+             units="bytes"
+             symbol_name="GtiReadThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GTI L3 Throughput"
+             description="The total number of GPU memory bytes transferred between L3 caches and GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="C 4 READ C 5 READ UADD 64 UMUL"
+             underscore_name="gti_l3_throughput"
+             units="bytes"
+             symbol_name="GtiL3Throughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Bank 00 IC Accesses"
+             description="The total number of accesses to L3 Bank 00 from IC cache."
+             data_type="uint64"
+             equation="B 0 READ B 1 READ UADD 2 UMUL $L3Bank00Accesses UMIN"
+             underscore_name="l3_bank00_ic_accesses"
+             units="messages"
+             symbol_name="L3Bank00IcAccesses"
+             availability="$SliceMask 0x01 AND"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="slice"
+             mdapi_group="L3/IC"
+             />
+    <counter name="L3 Bank 00 IC Hits"
+             description="The total number of hits in L3 Bank 00 from IC cache."
+             data_type="uint64"
+             equation="B 1 READ 2 UMUL $L3Bank00IcAccesses UMIN"
+             underscore_name="l3_bank00_ic_hits"
+             units="messages"
+             symbol_name="L3Bank00IcHits"
+             availability="$SliceMask 0x01 AND"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="slice"
+             mdapi_group="L3/IC"
+             />
+    <counter name="Sampler Accesses"
+             description="The total number of messages sent to samplers."
+             data_type="uint64"
+             equation="A 28 READ"
+             underscore_name="sampler_accesses"
+             units="messages"
+             symbol_name="SamplerAccesses"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler"
+             />
+    <counter name="L3 Bank 01 Accesses"
+             description="The total number of accesses to L3 Bank 01."
+             data_type="uint64"
+             equation="C 1 READ 2 UMUL"
+             underscore_name="l3_bank01_accesses"
+             units="messages"
+             symbol_name="L3Bank01Accesses"
+             availability="$SliceMask 0x01 AND"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="slice"
+             mdapi_group="L3"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU0 Ternary Instruction"
+             description="The percentage of time in which execution units were actively processing ternary instructions on FPU0."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_ternary_fpu0_instruction"
+             units="percent"
+             symbol_name="EuTernaryFpu0Instruction"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes/Instructions"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU FPU1 Move Instruction"
+             description="The percentage of time in which execution units were actively processing move instructions on FPU1."
+             data_type="float"
+             max_equation="100"
+             equation="A 20 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_move_fpu1_instruction"
+             units="percent"
+             symbol_name="EuMoveFpu1Instruction"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes/Instructions"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="L3 Bank 02 Accesses"
+             description="The total number of accesses to L3 Bank 02."
+             data_type="uint64"
+             equation="B 2 READ 2 UMUL"
+             underscore_name="l3_bank02_accesses"
+             units="messages"
+             symbol_name="L3Bank02Accesses"
+             availability="$SliceMask 0x01 AND"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="slice"
+             mdapi_group="L3"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="L3 Total Throughput"
+             description="The total number of GPU memory bytes transferred via L3."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="$L3Accesses 64 UMUL"
+             underscore_name="l3_total_throughput"
+             units="bytes"
+             symbol_name="L3TotalThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GTI Write Throughput"
+             description="The total number of GPU memory bytes written to GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 32 UMUL"
+             equation="C 7 READ 64 UMUL"
+             underscore_name="gti_write_throughput"
+             units="bytes"
+             symbol_name="GtiWriteThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="EU FPU1 Binary Instruction"
+             description="The percentage of time in which execution units were actively processing binary instructions on FPU1."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_binary_fpu1_instruction"
+             units="percent"
+             symbol_name="EuBinaryFpu1Instruction"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes/Instructions"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU1 Ternary Instruction"
+             description="The percentage of time in which execution units were actively processing ternary instructions on FPU1."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_ternary_fpu1_instruction"
+             units="percent"
+             symbol_name="EuTernaryFpu1Instruction"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes/Instructions"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_send_active"
+             units="percent"
+             symbol_name="EuSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x166C0760" />
+        <register type="NOA" address="0x00009888" value="0x1593001E" />
+        <register type="NOA" address="0x00009888" value="0x3F900003" />
+        <register type="NOA" address="0x00009888" value="0x004E8000" />
+        <register type="NOA" address="0x00009888" value="0x0E4E8000" />
+        <register type="NOA" address="0x00009888" value="0x184E8000" />
+        <register type="NOA" address="0x00009888" value="0x1A4E8020" />
+        <register type="NOA" address="0x00009888" value="0x1C4E0002" />
+        <register type="NOA" address="0x00009888" value="0x006C0051" />
+        <register type="NOA" address="0x00009888" value="0x066C5000" />
+        <register type="NOA" address="0x00009888" value="0x086C5C5D" />
+        <register type="NOA" address="0x00009888" value="0x0E6C5E5F" />
+        <register type="NOA" address="0x00009888" value="0x106C0000" />
+        <register type="NOA" address="0x00009888" value="0x186C0000" />
+        <register type="NOA" address="0x00009888" value="0x1C6C0000" />
+        <register type="NOA" address="0x00009888" value="0x1E6C0000" />
+        <register type="NOA" address="0x00009888" value="0x001B4000" />
+        <register type="NOA" address="0x00009888" value="0x061B8000" />
+        <register type="NOA" address="0x00009888" value="0x081BC000" />
+        <register type="NOA" address="0x00009888" value="0x0E1BC000" />
+        <register type="NOA" address="0x00009888" value="0x101C8000" />
+        <register type="NOA" address="0x00009888" value="0x1A1CE000" />
+        <register type="NOA" address="0x00009888" value="0x1C1C0030" />
+        <register type="NOA" address="0x00009888" value="0x004C8000" />
+        <register type="NOA" address="0x00009888" value="0x0A4C2A00" />
+        <register type="NOA" address="0x00009888" value="0x0C4C0280" />
+        <register type="NOA" address="0x00009888" value="0x000D2000" />
+        <register type="NOA" address="0x00009888" value="0x060D8000" />
+        <register type="NOA" address="0x00009888" value="0x080DA000" />
+        <register type="NOA" address="0x00009888" value="0x0E0DA000" />
+        <register type="NOA" address="0x00009888" value="0x0C0F0400" />
+        <register type="NOA" address="0x00009888" value="0x0E0F1500" />
+        <register type="NOA" address="0x00009888" value="0x100F0140" />
+        <register type="NOA" address="0x00009888" value="0x002C8000" />
+        <register type="NOA" address="0x00009888" value="0x0E2C8000" />
+        <register type="NOA" address="0x00009888" value="0x162C0A00" />
+        <register type="NOA" address="0x00009888" value="0x182C00A0" />
+        <register type="NOA" address="0x00009888" value="0x03933300" />
+        <register type="NOA" address="0x00009888" value="0x05930032" />
+        <register type="NOA" address="0x00009888" value="0x11930000" />
+        <register type="NOA" address="0x00009888" value="0x1B930000" />
+        <register type="NOA" address="0x00009888" value="0x1D900157" />
+        <register type="NOA" address="0x00009888" value="0x1F900158" />
+        <register type="NOA" address="0x00009888" value="0x35900000" />
+        <register type="NOA" address="0x00009888" value="0x19908000" />
+        <register type="NOA" address="0x00009888" value="0x1B908000" />
+        <register type="NOA" address="0x00009888" value="0x1190030F" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x41900000" />
+        <register type="NOA" address="0x00009888" value="0x55900000" />
+        <register type="NOA" address="0x00009888" value="0x45900063" />
+        <register type="NOA" address="0x00009888" value="0x47900000" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+        <register type="NOA" address="0x00009888" value="0x57900000" />
+        <register type="NOA" address="0x00009888" value="0x4B900000" />
+        <register type="NOA" address="0x00009888" value="0x59900000" />
+        <register type="NOA" address="0x00009888" value="0x53903333" />
+        <register type="NOA" address="0x00009888" value="0x43900840" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x30800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x30800000" />
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002770" value="0x0007FFFA" />
+        <register type="OA" address="0x00002774" value="0x0000FEFE" />
+        <register type="OA" address="0x00002778" value="0x0007FFFA" />
+        <register type="OA" address="0x0000277C" value="0x0000FEFD" />
+        <register type="OA" address="0x00002790" value="0x0007FFFA" />
+        <register type="OA" address="0x00002794" value="0x0000FBEF" />
+        <register type="OA" address="0x00002798" value="0x0007FFFA" />
+        <register type="OA" address="0x0000279C" value="0x0000FBDF" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00000003" />
+        <register type="FLEX" address="0x0000E658" value="0x00002001" />
+        <register type="FLEX" address="0x0000E758" value="0x00101100" />
+        <register type="FLEX" address="0x0000E45C" value="0x00201200" />
+        <register type="FLEX" address="0x0000E55C" value="0x00301300" />
+        <register type="FLEX" address="0x0000E65C" value="0x00401400" />
+    </register_config>
+  </set>
+
+  <set name="Metric set HDCAndSF"
+       mdapi_supported_apis="VK OGL OCL IO BB"
+       underscore_name="hdc_and_sf"
+       hw_config_guid="a1b8363b-b986-47b6-929a-847afde3dec8"
+       chipset="SKLGT3"
+       symbol_name="HDCAndSF"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SQ is full"
+             description="The percentage of time when SQ is filled above a threshold (usually 48 entries)."
+             data_type="float"
+             max_equation="100"
+             equation="PERFCNT1 READ_REG 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gt_request_queue_full"
+             units="percent"
+             symbol_name="GTRequestQueueFull"
+             availability="true $QueryMode &&"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL4 OCL"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were actively processed on both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="Polygon Data Ready"
+             description="The percentage of time in which geometry pipeline output is ready"
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="poly_data_ready"
+             units="percent"
+             symbol_name="PolyDataReady"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/3D Pipe/Strip-Fans"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texel lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="HDC stalled by L3 (s0.ss1)"
+             description="Percentage of time when HDC has messages to L3, but it's stalled due to lack of credits (s0.ss1)"
+             data_type="float"
+             max_equation="100"
+             equation="C 5 READ C 4 READ USUB 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="non_sampler_shader01_access_stalled_on_l3"
+             units="percent"
+             symbol_name="NonSamplerShader01AccessStalledOnL3"
+             availability="$SubsliceMask 0x2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="GPU/Data Port"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="HDC stalled by L3 (s0.ss2)"
+             description="Percentage of time when HDC has messages to L3, but it's stalled due to lack of credits (s0.ss2)"
+             data_type="float"
+             max_equation="100"
+             equation="C 3 READ C 2 READ USUB 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="non_sampler_shader02_access_stalled_on_l3"
+             units="percent"
+             symbol_name="NonSamplerShader02AccessStalledOnL3"
+             availability="$SubsliceMask 0x4 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="GPU/Data Port"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="HDC stalled by L3 (s0.ss0)"
+             description="Percentage of time when HDC has messages to L3, but it's stalled due to lack of credits (s0.ss0)"
+             data_type="float"
+             max_equation="100"
+             equation="C 7 READ C 6 READ USUB 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="non_sampler_shader00_access_stalled_on_l3"
+             units="percent"
+             symbol_name="NonSamplerShader00AccessStalledOnL3"
+             availability="$SubsliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="GPU/Data Port"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x000091BC" value="0xE0500000" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x104F0232" />
+        <register type="NOA" address="0x00009888" value="0x124F4640" />
+        <register type="NOA" address="0x00009888" value="0x106C0232" />
+        <register type="NOA" address="0x00009888" value="0x11834400" />
+        <register type="NOA" address="0x00009888" value="0x0A4E8000" />
+        <register type="NOA" address="0x00009888" value="0x0C4E8000" />
+        <register type="NOA" address="0x00009888" value="0x004F1880" />
+        <register type="NOA" address="0x00009888" value="0x024F08BB" />
+        <register type="NOA" address="0x00009888" value="0x044F001B" />
+        <register type="NOA" address="0x00009888" value="0x046C0100" />
+        <register type="NOA" address="0x00009888" value="0x066C000B" />
+        <register type="NOA" address="0x00009888" value="0x1A6C0000" />
+        <register type="NOA" address="0x00009888" value="0x041B8000" />
+        <register type="NOA" address="0x00009888" value="0x061B4000" />
+        <register type="NOA" address="0x00009888" value="0x1A1C1800" />
+        <register type="NOA" address="0x00009888" value="0x005B8000" />
+        <register type="NOA" address="0x00009888" value="0x025BC000" />
+        <register type="NOA" address="0x00009888" value="0x045B4000" />
+        <register type="NOA" address="0x00009888" value="0x125C8000" />
+        <register type="NOA" address="0x00009888" value="0x145C8000" />
+        <register type="NOA" address="0x00009888" value="0x165C8000" />
+        <register type="NOA" address="0x00009888" value="0x185C8000" />
+        <register type="NOA" address="0x00009888" value="0x0A4C00A0" />
+        <register type="NOA" address="0x00009888" value="0x000D8000" />
+        <register type="NOA" address="0x00009888" value="0x020DA000" />
+        <register type="NOA" address="0x00009888" value="0x040DA000" />
+        <register type="NOA" address="0x00009888" value="0x060D2000" />
+        <register type="NOA" address="0x00009888" value="0x0C0F5000" />
+        <register type="NOA" address="0x00009888" value="0x0E0F0055" />
+        <register type="NOA" address="0x00009888" value="0x022CC000" />
+        <register type="NOA" address="0x00009888" value="0x042CC000" />
+        <register type="NOA" address="0x00009888" value="0x062CC000" />
+        <register type="NOA" address="0x00009888" value="0x082CC000" />
+        <register type="NOA" address="0x00009888" value="0x0A2C8000" />
+        <register type="NOA" address="0x00009888" value="0x0C2C8000" />
+        <register type="NOA" address="0x00009888" value="0x0F828000" />
+        <register type="NOA" address="0x00009888" value="0x0F8305C0" />
+        <register type="NOA" address="0x00009888" value="0x09830000" />
+        <register type="NOA" address="0x00009888" value="0x07830000" />
+        <register type="NOA" address="0x00009888" value="0x1D950080" />
+        <register type="NOA" address="0x00009888" value="0x13928000" />
+        <register type="NOA" address="0x00009888" value="0x0F988000" />
+        <register type="NOA" address="0x00009888" value="0x31904000" />
+        <register type="NOA" address="0x00009888" value="0x1190FC00" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x59900005" />
+        <register type="NOA" address="0x00009888" value="0x4B900000" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x41900800" />
+        <register type="NOA" address="0x00009888" value="0x43900842" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+        <register type="NOA" address="0x00009888" value="0x45900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002744" value="0x00800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x10800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+        <register type="OA" address="0x00002770" value="0x00000002" />
+        <register type="OA" address="0x00002774" value="0x0000FDFF" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E758" value="0x00015014" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+        <register type="FLEX" address="0x0000E65C" value="0x00055054" />
+    </register_config>
+  </set>
+
+  <set name="Metric set L3_1"
+       mdapi_supported_apis="VK OGL OCL IO BB"
+       underscore_name="l3_1"
+       hw_config_guid="fa857069-7f95-44c9-a3e0-cb8ccbc35abb"
+       chipset="SKLGT3"
+       symbol_name="L3_1"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 L3 Bank1 Active"
+             description="The percentage of time in which slice0 L3 bank1 is active"
+             data_type="float"
+             max_equation="100"
+             equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l30_bank1_active"
+             units="percent"
+             symbol_name="L30Bank1Active"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SQ is full"
+             description="The percentage of time when SQ is filled above a threshold (usually 48 entries)"
+             data_type="float"
+             max_equation="100"
+             equation="PERFCNT1 READ_REG 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gt_request_queue_full"
+             units="percent"
+             symbol_name="GTRequestQueueFull"
+             availability="true $QueryMode &&"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL4 OCL"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on the both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="Slice0 L3 Bank1 Stalled"
+             description="The percentage of time in which slice0 L3 bank1 is stalled"
+             data_type="float"
+             max_equation="100"
+             equation="B 4 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l30_bank1_stalled"
+             units="percent"
+             symbol_name="L30Bank1Stalled"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 L3 Bank0 Active"
+             description="The percentage of time in which slice0 L3 bank0 is active"
+             data_type="float"
+             max_equation="100"
+             equation="C 6 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l30_bank0_active"
+             units="percent"
+             symbol_name="L30Bank0Active"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 L3 Bank0 Stalled"
+             description="The percentage of time in which slice0 L3 bank0 is stalled"
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l30_bank0_stalled"
+             units="percent"
+             symbol_name="L30Bank0Stalled"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x000091BC" value="0xE0500000" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x126C7B40" />
+        <register type="NOA" address="0x00009888" value="0x166C0020" />
+        <register type="NOA" address="0x00009888" value="0x0A603444" />
+        <register type="NOA" address="0x00009888" value="0x0A613400" />
+        <register type="NOA" address="0x00009888" value="0x1A4EA800" />
+        <register type="NOA" address="0x00009888" value="0x1C4E0002" />
+        <register type="NOA" address="0x00009888" value="0x024E8000" />
+        <register type="NOA" address="0x00009888" value="0x044E8000" />
+        <register type="NOA" address="0x00009888" value="0x064E8000" />
+        <register type="NOA" address="0x00009888" value="0x084E8000" />
+        <register type="NOA" address="0x00009888" value="0x0A4E8000" />
+        <register type="NOA" address="0x00009888" value="0x064F4000" />
+        <register type="NOA" address="0x00009888" value="0x0C6C5327" />
+        <register type="NOA" address="0x00009888" value="0x0E6C5425" />
+        <register type="NOA" address="0x00009888" value="0x006C2A00" />
+        <register type="NOA" address="0x00009888" value="0x026C285B" />
+        <register type="NOA" address="0x00009888" value="0x046C005C" />
+        <register type="NOA" address="0x00009888" value="0x106C0000" />
+        <register type="NOA" address="0x00009888" value="0x1C6C0000" />
+        <register type="NOA" address="0x00009888" value="0x1E6C0000" />
+        <register type="NOA" address="0x00009888" value="0x1A6C0800" />
+        <register type="NOA" address="0x00009888" value="0x0C1BC000" />
+        <register type="NOA" address="0x00009888" value="0x0E1BC000" />
+        <register type="NOA" address="0x00009888" value="0x001B8000" />
+        <register type="NOA" address="0x00009888" value="0x021BC000" />
+        <register type="NOA" address="0x00009888" value="0x041BC000" />
+        <register type="NOA" address="0x00009888" value="0x1C1C003C" />
+        <register type="NOA" address="0x00009888" value="0x121C8000" />
+        <register type="NOA" address="0x00009888" value="0x141C8000" />
+        <register type="NOA" address="0x00009888" value="0x161C8000" />
+        <register type="NOA" address="0x00009888" value="0x181C8000" />
+        <register type="NOA" address="0x00009888" value="0x1A1C0800" />
+        <register type="NOA" address="0x00009888" value="0x065B4000" />
+        <register type="NOA" address="0x00009888" value="0x1A5C1000" />
+        <register type="NOA" address="0x00009888" value="0x10600000" />
+        <register type="NOA" address="0x00009888" value="0x04600000" />
+        <register type="NOA" address="0x00009888" value="0x0C610044" />
+        <register type="NOA" address="0x00009888" value="0x10610000" />
+        <register type="NOA" address="0x00009888" value="0x06610000" />
+        <register type="NOA" address="0x00009888" value="0x0C4C02A8" />
+        <register type="NOA" address="0x00009888" value="0x084CA000" />
+        <register type="NOA" address="0x00009888" value="0x0A4C002A" />
+        <register type="NOA" address="0x00009888" value="0x0C0DA000" />
+        <register type="NOA" address="0x00009888" value="0x0E0DA000" />
+        <register type="NOA" address="0x00009888" value="0x000D8000" />
+        <register type="NOA" address="0x00009888" value="0x020DA000" />
+        <register type="NOA" address="0x00009888" value="0x040DA000" />
+        <register type="NOA" address="0x00009888" value="0x060D2000" />
+        <register type="NOA" address="0x00009888" value="0x100F0154" />
+        <register type="NOA" address="0x00009888" value="0x0C0F5000" />
+        <register type="NOA" address="0x00009888" value="0x0E0F0055" />
+        <register type="NOA" address="0x00009888" value="0x182C00AA" />
+        <register type="NOA" address="0x00009888" value="0x022C8000" />
+        <register type="NOA" address="0x00009888" value="0x042C8000" />
+        <register type="NOA" address="0x00009888" value="0x062C8000" />
+        <register type="NOA" address="0x00009888" value="0x082C8000" />
+        <register type="NOA" address="0x00009888" value="0x0A2C8000" />
+        <register type="NOA" address="0x00009888" value="0x0C2CC000" />
+        <register type="NOA" address="0x00009888" value="0x1190FFC0" />
+        <register type="NOA" address="0x00009888" value="0x57900000" />
+        <register type="NOA" address="0x00009888" value="0x49900420" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+        <register type="NOA" address="0x00009888" value="0x4B900021" />
+        <register type="NOA" address="0x00009888" value="0x59900000" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x41900400" />
+        <register type="NOA" address="0x00009888" value="0x43900421" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+        <register type="NOA" address="0x00009888" value="0x45900040" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002744" value="0x00800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0xF0800000" />
+        <register type="OA" address="0x00002770" value="0x00100070" />
+        <register type="OA" address="0x00002774" value="0x0000FFF1" />
+        <register type="OA" address="0x00002778" value="0x00014002" />
+        <register type="OA" address="0x0000277C" value="0x0000C3FF" />
+        <register type="OA" address="0x00002780" value="0x00010002" />
+        <register type="OA" address="0x00002784" value="0x0000C7FF" />
+        <register type="OA" address="0x00002788" value="0x00004002" />
+        <register type="OA" address="0x0000278C" value="0x0000D3FF" />
+        <register type="OA" address="0x00002790" value="0x00100700" />
+        <register type="OA" address="0x00002794" value="0x0000FF1F" />
+        <register type="OA" address="0x00002798" value="0x00001402" />
+        <register type="OA" address="0x0000279C" value="0x0000FC3F" />
+        <register type="OA" address="0x000027A0" value="0x00001002" />
+        <register type="OA" address="0x000027A4" value="0x0000FC7F" />
+        <register type="OA" address="0x000027A8" value="0x00000402" />
+        <register type="OA" address="0x000027AC" value="0x0000FD3F" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E758" value="0x00015014" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+        <register type="FLEX" address="0x0000E65C" value="0x00055054" />
+    </register_config>
+  </set>
+
+  <set name="Metric set L3_2"
+       mdapi_supported_apis="VK OGL OCL IO BB"
+       underscore_name="l3_2"
+       hw_config_guid="9830a5f3-a5e2-4773-a49d-6371407c382a"
+       chipset="SKLGT3"
+       symbol_name="L3_2"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SQ is full"
+             description="The percentage of time when SQ is filled above a threshold (usually 48 entries)"
+             data_type="float"
+             max_equation="100"
+             equation="PERFCNT1 READ_REG 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gt_request_queue_full"
+             units="percent"
+             symbol_name="GTRequestQueueFull"
+             availability="true $QueryMode &&"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL4 OCL"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on the both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 L3 Bank2 Stalled"
+             description="The percentage of time in which slice0 L3 bank2 is stalled"
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l30_bank2_stalled"
+             units="percent"
+             symbol_name="L30Bank2Stalled"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 L3 Bank2 Active"
+             description="The percentage of time in which slice0 L3 bank2 is active"
+             data_type="float"
+             max_equation="100"
+             equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l30_bank2_active"
+             units="percent"
+             symbol_name="L30Bank2Active"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x000091BC" value="0xE0500000" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x126C02E0" />
+        <register type="NOA" address="0x00009888" value="0x146C0001" />
+        <register type="NOA" address="0x00009888" value="0x0A623400" />
+        <register type="NOA" address="0x00009888" value="0x044E8000" />
+        <register type="NOA" address="0x00009888" value="0x064E8000" />
+        <register type="NOA" address="0x00009888" value="0x084E8000" />
+        <register type="NOA" address="0x00009888" value="0x0A4E8000" />
+        <register type="NOA" address="0x00009888" value="0x064F4000" />
+        <register type="NOA" address="0x00009888" value="0x026C3324" />
+        <register type="NOA" address="0x00009888" value="0x046C3422" />
+        <register type="NOA" address="0x00009888" value="0x106C0000" />
+        <register type="NOA" address="0x00009888" value="0x1A6C0000" />
+        <register type="NOA" address="0x00009888" value="0x021BC000" />
+        <register type="NOA" address="0x00009888" value="0x041BC000" />
+        <register type="NOA" address="0x00009888" value="0x141C8000" />
+        <register type="NOA" address="0x00009888" value="0x161C8000" />
+        <register type="NOA" address="0x00009888" value="0x181C8000" />
+        <register type="NOA" address="0x00009888" value="0x1A1C0800" />
+        <register type="NOA" address="0x00009888" value="0x065B4000" />
+        <register type="NOA" address="0x00009888" value="0x1A5C1000" />
+        <register type="NOA" address="0x00009888" value="0x06614000" />
+        <register type="NOA" address="0x00009888" value="0x0C620044" />
+        <register type="NOA" address="0x00009888" value="0x10620000" />
+        <register type="NOA" address="0x00009888" value="0x06620000" />
+        <register type="NOA" address="0x00009888" value="0x084C8000" />
+        <register type="NOA" address="0x00009888" value="0x0A4C002A" />
+        <register type="NOA" address="0x00009888" value="0x020DA000" />
+        <register type="NOA" address="0x00009888" value="0x040DA000" />
+        <register type="NOA" address="0x00009888" value="0x060D2000" />
+        <register type="NOA" address="0x00009888" value="0x0C0F4000" />
+        <register type="NOA" address="0x00009888" value="0x0E0F0055" />
+        <register type="NOA" address="0x00009888" value="0x042C8000" />
+        <register type="NOA" address="0x00009888" value="0x062C8000" />
+        <register type="NOA" address="0x00009888" value="0x082C8000" />
+        <register type="NOA" address="0x00009888" value="0x0A2C8000" />
+        <register type="NOA" address="0x00009888" value="0x0C2CC000" />
+        <register type="NOA" address="0x00009888" value="0x1190F800" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x43900000" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+        <register type="NOA" address="0x00009888" value="0x45900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002744" value="0x00800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+        <register type="OA" address="0x00002770" value="0x00100070" />
+        <register type="OA" address="0x00002774" value="0x0000FFF1" />
+        <register type="OA" address="0x00002778" value="0x00028002" />
+        <register type="OA" address="0x0000277C" value="0x000087FF" />
+        <register type="OA" address="0x00002780" value="0x00020002" />
+        <register type="OA" address="0x00002784" value="0x00008FFF" />
+        <register type="OA" address="0x00002788" value="0x00008002" />
+        <register type="OA" address="0x0000278C" value="0x0000A7FF" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E758" value="0x00015014" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+        <register type="FLEX" address="0x0000E65C" value="0x00055054" />
+    </register_config>
+  </set>
+
+  <set name="Metric set L3_3"
+       mdapi_supported_apis="VK OGL OCL IO BB"
+       underscore_name="l3_3"
+       hw_config_guid="59452ceb-24bb-4878-87ec-87aab7b4f9db"
+       chipset="SKLGT3"
+       symbol_name="L3_3"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SQ is full"
+             description="The percentage of time when SQ is filled above a threshold (usually 48 entries)"
+             data_type="float"
+             max_equation="100"
+             equation="PERFCNT1 READ_REG 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gt_request_queue_full"
+             units="percent"
+             symbol_name="GTRequestQueueFull"
+             availability="true $QueryMode &&"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL4 OCL"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on the both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Slice0 L3 Bank3 Stalled"
+             description="The percentage of time in which slice0 L3 bank3 is stalled"
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l30_bank3_stalled"
+             units="percent"
+             symbol_name="L30Bank3Stalled"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 L3 Bank3 Active"
+             description="The percentage of time in which slice0 L3 bank3 is active"
+             data_type="float"
+             max_equation="100"
+             equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l30_bank3_active"
+             units="percent"
+             symbol_name="L30Bank3Active"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x000091BC" value="0xE0500000" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x126C4E80" />
+        <register type="NOA" address="0x00009888" value="0x146C0000" />
+        <register type="NOA" address="0x00009888" value="0x0A633400" />
+        <register type="NOA" address="0x00009888" value="0x044E8000" />
+        <register type="NOA" address="0x00009888" value="0x064E8000" />
+        <register type="NOA" address="0x00009888" value="0x084E8000" />
+        <register type="NOA" address="0x00009888" value="0x0A4E8000" />
+        <register type="NOA" address="0x00009888" value="0x0C4E8000" />
+        <register type="NOA" address="0x00009888" value="0x026C3321" />
+        <register type="NOA" address="0x00009888" value="0x046C342F" />
+        <register type="NOA" address="0x00009888" value="0x106C0000" />
+        <register type="NOA" address="0x00009888" value="0x1A6C2000" />
+        <register type="NOA" address="0x00009888" value="0x021BC000" />
+        <register type="NOA" address="0x00009888" value="0x041BC000" />
+        <register type="NOA" address="0x00009888" value="0x061B4000" />
+        <register type="NOA" address="0x00009888" value="0x141C8000" />
+        <register type="NOA" address="0x00009888" value="0x161C8000" />
+        <register type="NOA" address="0x00009888" value="0x181C8000" />
+        <register type="NOA" address="0x00009888" value="0x1A1C1800" />
+        <register type="NOA" address="0x00009888" value="0x06604000" />
+        <register type="NOA" address="0x00009888" value="0x0C630044" />
+        <register type="NOA" address="0x00009888" value="0x10630000" />
+        <register type="NOA" address="0x00009888" value="0x06630000" />
+        <register type="NOA" address="0x00009888" value="0x084C8000" />
+        <register type="NOA" address="0x00009888" value="0x0A4C00AA" />
+        <register type="NOA" address="0x00009888" value="0x020DA000" />
+        <register type="NOA" address="0x00009888" value="0x040DA000" />
+        <register type="NOA" address="0x00009888" value="0x060D2000" />
+        <register type="NOA" address="0x00009888" value="0x0C0F4000" />
+        <register type="NOA" address="0x00009888" value="0x0E0F0055" />
+        <register type="NOA" address="0x00009888" value="0x042C8000" />
+        <register type="NOA" address="0x00009888" value="0x062C8000" />
+        <register type="NOA" address="0x00009888" value="0x082C8000" />
+        <register type="NOA" address="0x00009888" value="0x0A2C8000" />
+        <register type="NOA" address="0x00009888" value="0x0C2C8000" />
+        <register type="NOA" address="0x00009888" value="0x1190F800" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x43900842" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+        <register type="NOA" address="0x00009888" value="0x45900002" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002744" value="0x00800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+        <register type="OA" address="0x00002770" value="0x00100070" />
+        <register type="OA" address="0x00002774" value="0x0000FFF1" />
+        <register type="OA" address="0x00002778" value="0x00028002" />
+        <register type="OA" address="0x0000277C" value="0x000087FF" />
+        <register type="OA" address="0x00002780" value="0x00020002" />
+        <register type="OA" address="0x00002784" value="0x00008FFF" />
+        <register type="OA" address="0x00002788" value="0x00008002" />
+        <register type="OA" address="0x0000278C" value="0x0000A7FF" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E758" value="0x00015014" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+        <register type="FLEX" address="0x0000E65C" value="0x00055054" />
+    </register_config>
+  </set>
+
+  <set name="Metric set RasterizerAndPixelBackend"
+       mdapi_supported_apis="VK OGL OCL IO BB"
+       underscore_name="rasterizer_and_pixel_backend"
+       hw_config_guid="d2249ff7-34b4-4203-b474-7c11546f9dae"
+       chipset="SKLGT3"
+       symbol_name="RasterizerAndPixelBackend"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SQ is full"
+             description="The percentage of time when SQ is filled above a threshold (usually 48 entries)"
+             data_type="float"
+             max_equation="100"
+             equation="PERFCNT1 READ_REG 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gt_request_queue_full"
+             units="percent"
+             symbol_name="GTRequestQueueFull"
+             availability="true $QueryMode &&"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL4 OCL"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on the both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Slice0 Pixel Values Ready"
+             description="The percentage of time in which slice0 pixel values are ready"
+             data_type="float"
+             max_equation="100"
+             equation="C 6 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="pixel_values0_ready"
+             units="percent"
+             symbol_name="PixelValues0Ready"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/3D Pipe"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texel lookups (with 2x2 accuracy) that missed the L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="Slice0 Rasterizer Input Available"
+             description="The percentage of time in which slice0 rasterizer input is available"
+             data_type="float"
+             max_equation="100"
+             equation="B 1 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="rasterizer0_input_available"
+             units="percent"
+             symbol_name="Rasterizer0InputAvailable"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Rasterizer"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Slice0 Post-EarlyZ Pixel Data Ready"
+             description="The percentage of time in which slice0 post-EarlyZ pixel data is ready (after early Z tests have been applied)"
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="pixel_data0_ready"
+             units="percent"
+             symbol_name="PixelData0Ready"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Rasterizer/Early Depth Test"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 Rasterizer Output Ready"
+             description="The percentage of time in which slice0 rasterizer output is ready"
+             data_type="float"
+             max_equation="100"
+             equation="C 5 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="rasterizer0_output_ready"
+             units="percent"
+             symbol_name="Rasterizer0OutputReady"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Rasterizer"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="Slice0 PS Output Available"
+             description="The percentage of time in which slice0 PS output is available"
+             data_type="float"
+             max_equation="100"
+             equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_output0_available"
+             units="percent"
+             symbol_name="PSOutput0Available"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/3D Pipe"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x000091BC" value="0xE0500000" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x102F3800" />
+        <register type="NOA" address="0x00009888" value="0x144D0500" />
+        <register type="NOA" address="0x00009888" value="0x120D03C0" />
+        <register type="NOA" address="0x00009888" value="0x140D03CF" />
+        <register type="NOA" address="0x00009888" value="0x0C0F0004" />
+        <register type="NOA" address="0x00009888" value="0x0C4E4000" />
+        <register type="NOA" address="0x00009888" value="0x042F0480" />
+        <register type="NOA" address="0x00009888" value="0x082F0000" />
+        <register type="NOA" address="0x00009888" value="0x022F0000" />
+        <register type="NOA" address="0x00009888" value="0x0A4C0090" />
+        <register type="NOA" address="0x00009888" value="0x064D0027" />
+        <register type="NOA" address="0x00009888" value="0x004D0000" />
+        <register type="NOA" address="0x00009888" value="0x000D0D40" />
+        <register type="NOA" address="0x00009888" value="0x020D803F" />
+        <register type="NOA" address="0x00009888" value="0x040D8023" />
+        <register type="NOA" address="0x00009888" value="0x100D0000" />
+        <register type="NOA" address="0x00009888" value="0x060D2000" />
+        <register type="NOA" address="0x00009888" value="0x020F0010" />
+        <register type="NOA" address="0x00009888" value="0x000F0000" />
+        <register type="NOA" address="0x00009888" value="0x0E0F0050" />
+        <register type="NOA" address="0x00009888" value="0x0A2C8000" />
+        <register type="NOA" address="0x00009888" value="0x0C2C8000" />
+        <register type="NOA" address="0x00009888" value="0x1190FC00" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x41901400" />
+        <register type="NOA" address="0x00009888" value="0x43901485" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+        <register type="NOA" address="0x00009888" value="0x45900001" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002744" value="0x00800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x30800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+        <register type="OA" address="0x00002770" value="0x00000002" />
+        <register type="OA" address="0x00002774" value="0x0000EFFF" />
+        <register type="OA" address="0x00002778" value="0x00006000" />
+        <register type="OA" address="0x0000277C" value="0x0000F3FF" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E758" value="0x00015014" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+        <register type="FLEX" address="0x0000E65C" value="0x00055054" />
+    </register_config>
+  </set>
+
+  <set name="Metric set Sampler"
+       mdapi_supported_apis="VK OGL OCL IO BB"
+       underscore_name="sampler"
+       hw_config_guid="c9cf7c63-0065-4226-941e-98590bad8f75"
+       chipset="SKLGT3"
+       symbol_name="Sampler"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 Subslice2 Input Available"
+             description="The percentage of time in which slice0 subslice2 sampler input is available"
+             data_type="float"
+             max_equation="100"
+             equation="B 1 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler02_input_available"
+             units="percent"
+             symbol_name="Sampler02InputAvailable"
+             availability="$SubsliceMask 0x4 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SQ is full"
+             description="The percentage of time when SQ is filled above a threshold (usually 48 entries)"
+             data_type="float"
+             max_equation="100"
+             equation="PERFCNT1 READ_REG 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gt_request_queue_full"
+             units="percent"
+             symbol_name="GTRequestQueueFull"
+             availability="true $QueryMode &&"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL4 OCL"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 Subslice0 Input Available"
+             description="The percentage of time in which slice0 subslice0 sampler input is available"
+             data_type="float"
+             max_equation="100"
+             equation="B 2 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler00_input_available"
+             units="percent"
+             symbol_name="Sampler00InputAvailable"
+             availability="$SubsliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were actively processed on both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="Slice0 Subslice2 Sampler Output Ready"
+             description="The percentage of time in which slice0 subslice2 sampler output is ready"
+             data_type="float"
+             max_equation="100"
+             equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler02_output_ready"
+             units="percent"
+             symbol_name="Sampler02OutputReady"
+             availability="$SubsliceMask 0x4 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Slice0 Subslice1 Input Available"
+             description="The percentage of time in which slice0 subslice1 sampler input is available"
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler01_input_available"
+             units="percent"
+             symbol_name="Sampler01InputAvailable"
+             availability="$SubsliceMask 0x2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Slice0 Subslice0 Sampler Output Ready"
+             description="The percentage of time in which slice0 subslice0 sampler output is ready"
+             data_type="float"
+             max_equation="100"
+             equation="C 6 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler00_output_ready"
+             units="percent"
+             symbol_name="Sampler00OutputReady"
+             availability="$SubsliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Slice0 Subslice1 Sampler Output Ready"
+             description="The percentage of time in which slice0 subslice1 sampler output is ready"
+             data_type="float"
+             max_equation="100"
+             equation="C 5 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler01_output_ready"
+             units="percent"
+             symbol_name="Sampler01OutputReady"
+             availability="$SubsliceMask 0x2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x000091BC" value="0xE0500000" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x14152C00" />
+        <register type="NOA" address="0x00009888" value="0x16150005" />
+        <register type="NOA" address="0x00009888" value="0x121600A0" />
+        <register type="NOA" address="0x00009888" value="0x14352C00" />
+        <register type="NOA" address="0x00009888" value="0x16350005" />
+        <register type="NOA" address="0x00009888" value="0x123600A0" />
+        <register type="NOA" address="0x00009888" value="0x14552C00" />
+        <register type="NOA" address="0x00009888" value="0x16550005" />
+        <register type="NOA" address="0x00009888" value="0x125600A0" />
+        <register type="NOA" address="0x00009888" value="0x062F6000" />
+        <register type="NOA" address="0x00009888" value="0x022F2000" />
+        <register type="NOA" address="0x00009888" value="0x0C4C0050" />
+        <register type="NOA" address="0x00009888" value="0x0A4C0010" />
+        <register type="NOA" address="0x00009888" value="0x0C0D8000" />
+        <register type="NOA" address="0x00009888" value="0x0E0DA000" />
+        <register type="NOA" address="0x00009888" value="0x000D8000" />
+        <register type="NOA" address="0x00009888" value="0x020DA000" />
+        <register type="NOA" address="0x00009888" value="0x040DA000" />
+        <register type="NOA" address="0x00009888" value="0x060D2000" />
+        <register type="NOA" address="0x00009888" value="0x100F0350" />
+        <register type="NOA" address="0x00009888" value="0x0C0FB000" />
+        <register type="NOA" address="0x00009888" value="0x0E0F00DA" />
+        <register type="NOA" address="0x00009888" value="0x182C0028" />
+        <register type="NOA" address="0x00009888" value="0x0A2C8000" />
+        <register type="NOA" address="0x00009888" value="0x022DC000" />
+        <register type="NOA" address="0x00009888" value="0x042D4000" />
+        <register type="NOA" address="0x00009888" value="0x0C138000" />
+        <register type="NOA" address="0x00009888" value="0x0E132000" />
+        <register type="NOA" address="0x00009888" value="0x0413C000" />
+        <register type="NOA" address="0x00009888" value="0x1C140018" />
+        <register type="NOA" address="0x00009888" value="0x0C157000" />
+        <register type="NOA" address="0x00009888" value="0x0E150078" />
+        <register type="NOA" address="0x00009888" value="0x10150000" />
+        <register type="NOA" address="0x00009888" value="0x04162180" />
+        <register type="NOA" address="0x00009888" value="0x02160000" />
+        <register type="NOA" address="0x00009888" value="0x04174000" />
+        <register type="NOA" address="0x00009888" value="0x0233A000" />
+        <register type="NOA" address="0x00009888" value="0x04333000" />
+        <register type="NOA" address="0x00009888" value="0x14348000" />
+        <register type="NOA" address="0x00009888" value="0x16348000" />
+        <register type="NOA" address="0x00009888" value="0x02357870" />
+        <register type="NOA" address="0x00009888" value="0x10350000" />
+        <register type="NOA" address="0x00009888" value="0x04360043" />
+        <register type="NOA" address="0x00009888" value="0x02360000" />
+        <register type="NOA" address="0x00009888" value="0x04371000" />
+        <register type="NOA" address="0x00009888" value="0x0E538000" />
+        <register type="NOA" address="0x00009888" value="0x00538000" />
+        <register type="NOA" address="0x00009888" value="0x06533000" />
+        <register type="NOA" address="0x00009888" value="0x1C540020" />
+        <register type="NOA" address="0x00009888" value="0x12548000" />
+        <register type="NOA" address="0x00009888" value="0x0E557000" />
+        <register type="NOA" address="0x00009888" value="0x00557800" />
+        <register type="NOA" address="0x00009888" value="0x10550000" />
+        <register type="NOA" address="0x00009888" value="0x06560043" />
+        <register type="NOA" address="0x00009888" value="0x02560000" />
+        <register type="NOA" address="0x00009888" value="0x06571000" />
+        <register type="NOA" address="0x00009888" value="0x1190FF80" />
+        <register type="NOA" address="0x00009888" value="0x57900000" />
+        <register type="NOA" address="0x00009888" value="0x49900000" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+        <register type="NOA" address="0x00009888" value="0x4B900060" />
+        <register type="NOA" address="0x00009888" value="0x59900000" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x41900C00" />
+        <register type="NOA" address="0x00009888" value="0x43900842" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+        <register type="NOA" address="0x00009888" value="0x45900060" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002744" value="0x00800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x70800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+        <register type="OA" address="0x00002770" value="0x0000C000" />
+        <register type="OA" address="0x00002774" value="0x0000E7FF" />
+        <register type="OA" address="0x00002778" value="0x00003000" />
+        <register type="OA" address="0x0000277C" value="0x0000F9FF" />
+        <register type="OA" address="0x00002780" value="0x00000C00" />
+        <register type="OA" address="0x00002784" value="0x0000FE7F" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E758" value="0x00015014" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+        <register type="FLEX" address="0x0000E65C" value="0x00055054" />
+    </register_config>
+  </set>
+
+  <set name="Metric set TDL_1"
+       mdapi_supported_apis="VK OGL OCL IO BB"
+       underscore_name="tdl_1"
+       hw_config_guid="e3bb1501-89ca-43fb-8668-9d96159e10a2"
+       chipset="SKLGT3"
+       symbol_name="TDL_1"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SQ is full"
+             description="The percentage of time when SQ is filled above a threshold (usually 48 entries)"
+             data_type="float"
+             max_equation="100"
+             equation="PERFCNT1 READ_REG 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gt_request_queue_full"
+             units="percent"
+             symbol_name="GTRequestQueueFull"
+             availability="true $QueryMode &&"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL4 OCL"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on the both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="NonPS Thread Ready For Dispatch on Slice0 Subslice2"
+             description="The percentage of time in which non-PS thread is ready for dispatch on slice0 subslice2 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="B 4 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="non_ps_thread02_ready_for_dispatch"
+             units="percent"
+             symbol_name="NonPSThread02ReadyForDispatch"
+             availability="$SubsliceMask 0x4 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="NonPS Thread Ready For Dispatch on Slice0 Subslice0"
+             description="The percentage of time in which non-PS thread is ready for dispatch on slice0 subslice0 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="B 2 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="non_ps_thread00_ready_for_dispatch"
+             units="percent"
+             symbol_name="NonPSThread00ReadyForDispatch"
+             availability="$SubsliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Thread Ready For Dispatch on Slice0 Subslice0"
+             description="The percentage of time in which PS thread is ready for dispatch on slice0 subslice0 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="B 1 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_thread00_ready_for_dispatch"
+             units="percent"
+             symbol_name="PSThread00ReadyForDispatch"
+             availability="$SubsliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="PS Thread Ready For Dispatch on Slice0 Subslice1"
+             description="The percentage of time in which PS thread is ready for dispatch on slice0 subslice1 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="B 5 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_thread01_ready_for_dispatch"
+             units="percent"
+             symbol_name="PSThread01ReadyForDispatch"
+             availability="$SubsliceMask 0x2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="PS Thread Ready For Dispatch on Slice0 Subslice2"
+             description="The percentage of time in which PS thread is ready for dispatch on slice0 subslice2 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="B 3 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_thread02_ready_for_dispatch"
+             units="percent"
+             symbol_name="PSThread02ReadyForDispatch"
+             availability="$SubsliceMask 0x4 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <counter name="NonPS Thread Ready For Dispatch on Slice0 Subslice1"
+             description="The percentage of time in which non-PS thread is ready for dispatch on slice0 subslice1 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="non_ps_thread01_ready_for_dispatch"
+             units="percent"
+             symbol_name="NonPSThread01ReadyForDispatch"
+             availability="$SubsliceMask 0x2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x000091BC" value="0xE0500000" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x12120000" />
+        <register type="NOA" address="0x00009888" value="0x12320000" />
+        <register type="NOA" address="0x00009888" value="0x12520000" />
+        <register type="NOA" address="0x00009888" value="0x002F8000" />
+        <register type="NOA" address="0x00009888" value="0x022F3000" />
+        <register type="NOA" address="0x00009888" value="0x0A4C0015" />
+        <register type="NOA" address="0x00009888" value="0x0C0D8000" />
+        <register type="NOA" address="0x00009888" value="0x0E0DA000" />
+        <register type="NOA" address="0x00009888" value="0x000D8000" />
+        <register type="NOA" address="0x00009888" value="0x020DA000" />
+        <register type="NOA" address="0x00009888" value="0x040DA000" />
+        <register type="NOA" address="0x00009888" value="0x060D2000" />
+        <register type="NOA" address="0x00009888" value="0x100F03A0" />
+        <register type="NOA" address="0x00009888" value="0x0C0FF000" />
+        <register type="NOA" address="0x00009888" value="0x0E0F0095" />
+        <register type="NOA" address="0x00009888" value="0x062C8000" />
+        <register type="NOA" address="0x00009888" value="0x082C8000" />
+        <register type="NOA" address="0x00009888" value="0x0A2C8000" />
+        <register type="NOA" address="0x00009888" value="0x0C2D8000" />
+        <register type="NOA" address="0x00009888" value="0x0E2D4000" />
+        <register type="NOA" address="0x00009888" value="0x062D4000" />
+        <register type="NOA" address="0x00009888" value="0x02108000" />
+        <register type="NOA" address="0x00009888" value="0x0410C000" />
+        <register type="NOA" address="0x00009888" value="0x02118000" />
+        <register type="NOA" address="0x00009888" value="0x0411C000" />
+        <register type="NOA" address="0x00009888" value="0x02121880" />
+        <register type="NOA" address="0x00009888" value="0x041219B5" />
+        <register type="NOA" address="0x00009888" value="0x00120000" />
+        <register type="NOA" address="0x00009888" value="0x02134000" />
+        <register type="NOA" address="0x00009888" value="0x04135000" />
+        <register type="NOA" address="0x00009888" value="0x0C308000" />
+        <register type="NOA" address="0x00009888" value="0x0E304000" />
+        <register type="NOA" address="0x00009888" value="0x06304000" />
+        <register type="NOA" address="0x00009888" value="0x0C318000" />
+        <register type="NOA" address="0x00009888" value="0x0E314000" />
+        <register type="NOA" address="0x00009888" value="0x06314000" />
+        <register type="NOA" address="0x00009888" value="0x0C321A80" />
+        <register type="NOA" address="0x00009888" value="0x0E320033" />
+        <register type="NOA" address="0x00009888" value="0x06320031" />
+        <register type="NOA" address="0x00009888" value="0x00320000" />
+        <register type="NOA" address="0x00009888" value="0x0C334000" />
+        <register type="NOA" address="0x00009888" value="0x0E331000" />
+        <register type="NOA" address="0x00009888" value="0x06331000" />
+        <register type="NOA" address="0x00009888" value="0x0E508000" />
+        <register type="NOA" address="0x00009888" value="0x00508000" />
+        <register type="NOA" address="0x00009888" value="0x02504000" />
+        <register type="NOA" address="0x00009888" value="0x0E518000" />
+        <register type="NOA" address="0x00009888" value="0x00518000" />
+        <register type="NOA" address="0x00009888" value="0x02514000" />
+        <register type="NOA" address="0x00009888" value="0x0E521880" />
+        <register type="NOA" address="0x00009888" value="0x00521A80" />
+        <register type="NOA" address="0x00009888" value="0x02520033" />
+        <register type="NOA" address="0x00009888" value="0x0E534000" />
+        <register type="NOA" address="0x00009888" value="0x00534000" />
+        <register type="NOA" address="0x00009888" value="0x02531000" />
+        <register type="NOA" address="0x00009888" value="0x1190FF80" />
+        <register type="NOA" address="0x00009888" value="0x57900000" />
+        <register type="NOA" address="0x00009888" value="0x49900800" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+        <register type="NOA" address="0x00009888" value="0x4B900062" />
+        <register type="NOA" address="0x00009888" value="0x59900000" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x41900C00" />
+        <register type="NOA" address="0x00009888" value="0x43900003" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+        <register type="NOA" address="0x00009888" value="0x45900040" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002744" value="0x00800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x30800000" />
+        <register type="OA" address="0x00002770" value="0x00000002" />
+        <register type="OA" address="0x00002774" value="0x00007FFF" />
+        <register type="OA" address="0x00002778" value="0x00000000" />
+        <register type="OA" address="0x0000277C" value="0x00009FFF" />
+        <register type="OA" address="0x00002780" value="0x00000002" />
+        <register type="OA" address="0x00002784" value="0x0000EFFF" />
+        <register type="OA" address="0x00002788" value="0x00000000" />
+        <register type="OA" address="0x0000278C" value="0x0000F3FF" />
+        <register type="OA" address="0x00002790" value="0x00000002" />
+        <register type="OA" address="0x00002794" value="0x0000FDFF" />
+        <register type="OA" address="0x00002798" value="0x00000000" />
+        <register type="OA" address="0x0000279C" value="0x0000FE7F" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E758" value="0x00015014" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+        <register type="FLEX" address="0x0000E65C" value="0x00055054" />
+    </register_config>
+  </set>
+
+  <set name="Metric set TDL_2"
+       mdapi_supported_apis="VK OGL OCL IO BB"
+       underscore_name="tdl_2"
+       hw_config_guid="29194a55-7e75-4152-a71f-ef34b1ae4cca"
+       chipset="SKLGT3"
+       symbol_name="TDL_2"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SQ is full"
+             description="The percentage of time when SQ is filled above a threshold (usually 48 entries)"
+             data_type="float"
+             max_equation="100"
+             equation="PERFCNT1 READ_REG 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gt_request_queue_full"
+             units="percent"
+             symbol_name="GTRequestQueueFull"
+             availability="true $QueryMode &&"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL4 OCL"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on the both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Thread Header Ready on Slice0 Subslice1 Port 0"
+             description="The percentage of time in which the thread header is ready on slice0 subslice1 thread dispatcher port 0."
+             data_type="float"
+             max_equation="100"
+             equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header01_ready_port0"
+             units="percent"
+             symbol_name="ThreadHeader01ReadyPort0"
+             availability="$SubsliceMask 0x2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Thread Header Ready on Slice0 Subslice1 Port 1"
+             description="The percentage of time in which the thread header is ready on slice0 subslice1 thread dispatcher port 1."
+             data_type="float"
+             max_equation="100"
+             equation="C 2 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header01_ready_port1"
+             units="percent"
+             symbol_name="ThreadHeader01ReadyPort1"
+             availability="$SubsliceMask 0x2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texel lookups (with 2x2 accuracy) that missed the L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Thread Header Ready on Slice0 Subslice2 Port 1"
+             description="The percentage of time in which the thread header is ready on slice0 subslice2 thread dispatcher port 1."
+             data_type="float"
+             max_equation="100"
+             equation="C 4 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header02_ready_port1"
+             units="percent"
+             symbol_name="ThreadHeader02ReadyPort1"
+             availability="$SubsliceMask 0x4 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Thread Header Ready on Slice0 Subslice2 Port 0"
+             description="The percentage of time in which the thread header is ready on slice0 subslice2 thread dispatcher port 0."
+             data_type="float"
+             max_equation="100"
+             equation="C 3 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header02_ready_port0"
+             units="percent"
+             symbol_name="ThreadHeader02ReadyPort0"
+             availability="$SubsliceMask 0x4 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches without URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="Thread Header Ready on Slice0 Subslice0 Port 0"
+             description="The percentage of time in which the thread header is ready on slice0 subslice0 thread dispatcher port 0."
+             data_type="float"
+             max_equation="100"
+             equation="C 5 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header00_ready_port0"
+             units="percent"
+             symbol_name="ThreadHeader00ReadyPort0"
+             availability="$SubsliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <counter name="Thread Header Ready on Slice0 Subslice0 Port 1"
+             description="The percentage of time in which the thread header is ready on slice0 subslice0 thread dispatcher port 1."
+             data_type="float"
+             max_equation="100"
+             equation="C 6 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header00_ready_port1"
+             units="percent"
+             symbol_name="ThreadHeader00ReadyPort1"
+             availability="$SubsliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x000091BC" value="0xE0500000" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x12124D60" />
+        <register type="NOA" address="0x00009888" value="0x12322E60" />
+        <register type="NOA" address="0x00009888" value="0x12524D60" />
+        <register type="NOA" address="0x00009888" value="0x022F3000" />
+        <register type="NOA" address="0x00009888" value="0x0A4C0014" />
+        <register type="NOA" address="0x00009888" value="0x000D8000" />
+        <register type="NOA" address="0x00009888" value="0x020DA000" />
+        <register type="NOA" address="0x00009888" value="0x040DA000" />
+        <register type="NOA" address="0x00009888" value="0x060D2000" />
+        <register type="NOA" address="0x00009888" value="0x0C0FE000" />
+        <register type="NOA" address="0x00009888" value="0x0E0F0097" />
+        <register type="NOA" address="0x00009888" value="0x082C8000" />
+        <register type="NOA" address="0x00009888" value="0x0A2C8000" />
+        <register type="NOA" address="0x00009888" value="0x002D8000" />
+        <register type="NOA" address="0x00009888" value="0x062D4000" />
+        <register type="NOA" address="0x00009888" value="0x0410C000" />
+        <register type="NOA" address="0x00009888" value="0x0411C000" />
+        <register type="NOA" address="0x00009888" value="0x04121FB7" />
+        <register type="NOA" address="0x00009888" value="0x00120000" />
+        <register type="NOA" address="0x00009888" value="0x04135000" />
+        <register type="NOA" address="0x00009888" value="0x00308000" />
+        <register type="NOA" address="0x00009888" value="0x06304000" />
+        <register type="NOA" address="0x00009888" value="0x00318000" />
+        <register type="NOA" address="0x00009888" value="0x06314000" />
+        <register type="NOA" address="0x00009888" value="0x00321B80" />
+        <register type="NOA" address="0x00009888" value="0x0632003F" />
+        <register type="NOA" address="0x00009888" value="0x00334000" />
+        <register type="NOA" address="0x00009888" value="0x06331000" />
+        <register type="NOA" address="0x00009888" value="0x0250C000" />
+        <register type="NOA" address="0x00009888" value="0x0251C000" />
+        <register type="NOA" address="0x00009888" value="0x02521FB7" />
+        <register type="NOA" address="0x00009888" value="0x00520000" />
+        <register type="NOA" address="0x00009888" value="0x02535000" />
+        <register type="NOA" address="0x00009888" value="0x1190FC00" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x41900800" />
+        <register type="NOA" address="0x00009888" value="0x43900063" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+        <register type="NOA" address="0x00009888" value="0x45900040" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002744" value="0x00800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x00800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E758" value="0x00015014" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+        <register type="FLEX" address="0x0000E65C" value="0x00055054" />
+    </register_config>
+  </set>
+
+  <set name="Compute Metrics Extra Gen9"
+       mdapi_supported_apis="VK OGL4 OCL IO BB"
+       underscore_name="compute_extra"
+       hw_config_guid="2d80a648-7b5a-4e92-bbe7-3b5c76f2e221"
+       chipset="SKLGT3"
+       symbol_name="ComputeExtra"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="fpu1_active"
+             units="percent"
+             symbol_name="Fpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU1 Pipe Active including Ext Math"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing, including Extended Math processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ  C 5 READ C 6 READ FADD C 7 READ FADD C 2 READ FADD C 3 READ FADD C 4 READ FADD 8 FMUL FADD 100 FMUL $EuCoresTotalCount FDIV $GpuCoreClocks FDIV"
+             underscore_name="fpu1_active_adjusted"
+             units="percent"
+             symbol_name="Fpu1ActiveAdjusted"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x121203E0" />
+        <register type="NOA" address="0x00009888" value="0x123203E0" />
+        <register type="NOA" address="0x00009888" value="0x125203E0" />
+        <register type="NOA" address="0x00009888" value="0x129203E0" />
+        <register type="NOA" address="0x00009888" value="0x12B203E0" />
+        <register type="NOA" address="0x00009888" value="0x12D203E0" />
+        <register type="NOA" address="0x00009888" value="0x024EC000" />
+        <register type="NOA" address="0x00009888" value="0x044EC000" />
+        <register type="NOA" address="0x00009888" value="0x064EC000" />
+        <register type="NOA" address="0x00009888" value="0x022F4000" />
+        <register type="NOA" address="0x00009888" value="0x084CA000" />
+        <register type="NOA" address="0x00009888" value="0x0A4C0042" />
+        <register type="NOA" address="0x00009888" value="0x000D8000" />
+        <register type="NOA" address="0x00009888" value="0x020DA000" />
+        <register type="NOA" address="0x00009888" value="0x040DA000" />
+        <register type="NOA" address="0x00009888" value="0x060D2000" />
+        <register type="NOA" address="0x00009888" value="0x0C0F5000" />
+        <register type="NOA" address="0x00009888" value="0x0E0F006D" />
+        <register type="NOA" address="0x00009888" value="0x022C8000" />
+        <register type="NOA" address="0x00009888" value="0x042C8000" />
+        <register type="NOA" address="0x00009888" value="0x062C8000" />
+        <register type="NOA" address="0x00009888" value="0x0C2C8000" />
+        <register type="NOA" address="0x00009888" value="0x042D8000" />
+        <register type="NOA" address="0x00009888" value="0x06104000" />
+        <register type="NOA" address="0x00009888" value="0x06114000" />
+        <register type="NOA" address="0x00009888" value="0x06120033" />
+        <register type="NOA" address="0x00009888" value="0x00120000" />
+        <register type="NOA" address="0x00009888" value="0x06131000" />
+        <register type="NOA" address="0x00009888" value="0x04308000" />
+        <register type="NOA" address="0x00009888" value="0x04318000" />
+        <register type="NOA" address="0x00009888" value="0x04321980" />
+        <register type="NOA" address="0x00009888" value="0x00320000" />
+        <register type="NOA" address="0x00009888" value="0x04334000" />
+        <register type="NOA" address="0x00009888" value="0x04504000" />
+        <register type="NOA" address="0x00009888" value="0x04514000" />
+        <register type="NOA" address="0x00009888" value="0x04520033" />
+        <register type="NOA" address="0x00009888" value="0x00520000" />
+        <register type="NOA" address="0x00009888" value="0x04531000" />
+        <register type="NOA" address="0x00009888" value="0x00AF8000" />
+        <register type="NOA" address="0x00009888" value="0x0ACC0001" />
+        <register type="NOA" address="0x00009888" value="0x008D8000" />
+        <register type="NOA" address="0x00009888" value="0x028DA000" />
+        <register type="NOA" address="0x00009888" value="0x0C8FB000" />
+        <register type="NOA" address="0x00009888" value="0x0E8F0001" />
+        <register type="NOA" address="0x00009888" value="0x06AC8000" />
+        <register type="NOA" address="0x00009888" value="0x02AD4000" />
+        <register type="NOA" address="0x00009888" value="0x02908000" />
+        <register type="NOA" address="0x00009888" value="0x02918000" />
+        <register type="NOA" address="0x00009888" value="0x02921980" />
+        <register type="NOA" address="0x00009888" value="0x00920000" />
+        <register type="NOA" address="0x00009888" value="0x02934000" />
+        <register type="NOA" address="0x00009888" value="0x02B04000" />
+        <register type="NOA" address="0x00009888" value="0x02B14000" />
+        <register type="NOA" address="0x00009888" value="0x02B20033" />
+        <register type="NOA" address="0x00009888" value="0x00B20000" />
+        <register type="NOA" address="0x00009888" value="0x02B31000" />
+        <register type="NOA" address="0x00009888" value="0x00D08000" />
+        <register type="NOA" address="0x00009888" value="0x00D18000" />
+        <register type="NOA" address="0x00009888" value="0x00D21980" />
+        <register type="NOA" address="0x00009888" value="0x00D34000" />
+        <register type="NOA" address="0x00009888" value="0x1190FC00" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x41900C00" />
+        <register type="NOA" address="0x00009888" value="0x43900402" />
+        <register type="NOA" address="0x00009888" value="0x53901550" />
+        <register type="NOA" address="0x00009888" value="0x45900080" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+    </register_config>
+  </set>
+
+  <set name="Media Vme Pipe Gen9"
+       mdapi_supported_apis="MEDIA IO BB"
+       underscore_name="vme_pipe"
+       hw_config_guid="cfae9232-6ffc-42cc-a703-9790016925f0"
+       chipset="SKLGT3"
+       symbol_name="VMEPipe"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="EU Thread Occupancy"
+             description="The percentage of time in which hardware threads occupied EUs."
+             data_type="float"
+             max_equation="100"
+             equation="8 A 10 READ FMUL $EuThreadsCount FDIV $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_thread_occupancy"
+             units="percent"
+             symbol_name="EuThreadOccupancy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VME Busy"
+             description="The percentage of time in which VME (IME or CRE) was actively processing data."
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ B 3 READ FADD 2 FDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vme_busy"
+             units="percent"
+             symbol_name="VMEBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Overview System Batch Tier2"
+             mdapi_group="VME Pipe"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x141A5800" />
+        <register type="NOA" address="0x00009888" value="0x161A00C0" />
+        <register type="NOA" address="0x00009888" value="0x12180240" />
+        <register type="NOA" address="0x00009888" value="0x14180002" />
+        <register type="NOA" address="0x00009888" value="0x149A5800" />
+        <register type="NOA" address="0x00009888" value="0x169A00C0" />
+        <register type="NOA" address="0x00009888" value="0x12980240" />
+        <register type="NOA" address="0x00009888" value="0x14980002" />
+        <register type="NOA" address="0x00009888" value="0x1A4E3FC0" />
+        <register type="NOA" address="0x00009888" value="0x002F1000" />
+        <register type="NOA" address="0x00009888" value="0x022F8000" />
+        <register type="NOA" address="0x00009888" value="0x042F3000" />
+        <register type="NOA" address="0x00009888" value="0x004C4000" />
+        <register type="NOA" address="0x00009888" value="0x0A4C9500" />
+        <register type="NOA" address="0x00009888" value="0x0C4C002A" />
+        <register type="NOA" address="0x00009888" value="0x000D2000" />
+        <register type="NOA" address="0x00009888" value="0x060D8000" />
+        <register type="NOA" address="0x00009888" value="0x080DA000" />
+        <register type="NOA" address="0x00009888" value="0x0A0DA000" />
+        <register type="NOA" address="0x00009888" value="0x0C0DA000" />
+        <register type="NOA" address="0x00009888" value="0x0C0F0400" />
+        <register type="NOA" address="0x00009888" value="0x0E0F5500" />
+        <register type="NOA" address="0x00009888" value="0x100F0015" />
+        <register type="NOA" address="0x00009888" value="0x002C8000" />
+        <register type="NOA" address="0x00009888" value="0x0E2C8000" />
+        <register type="NOA" address="0x00009888" value="0x162CAA00" />
+        <register type="NOA" address="0x00009888" value="0x182C000A" />
+        <register type="NOA" address="0x00009888" value="0x04193000" />
+        <register type="NOA" address="0x00009888" value="0x081A28C1" />
+        <register type="NOA" address="0x00009888" value="0x001A0000" />
+        <register type="NOA" address="0x00009888" value="0x00133000" />
+        <register type="NOA" address="0x00009888" value="0x0613C000" />
+        <register type="NOA" address="0x00009888" value="0x0813F000" />
+        <register type="NOA" address="0x00009888" value="0x00172000" />
+        <register type="NOA" address="0x00009888" value="0x06178000" />
+        <register type="NOA" address="0x00009888" value="0x0817A000" />
+        <register type="NOA" address="0x00009888" value="0x00180037" />
+        <register type="NOA" address="0x00009888" value="0x06180940" />
+        <register type="NOA" address="0x00009888" value="0x08180000" />
+        <register type="NOA" address="0x00009888" value="0x02180000" />
+        <register type="NOA" address="0x00009888" value="0x04183000" />
+        <register type="NOA" address="0x00009888" value="0x04AFC000" />
+        <register type="NOA" address="0x00009888" value="0x06AF3000" />
+        <register type="NOA" address="0x00009888" value="0x0ACC4000" />
+        <register type="NOA" address="0x00009888" value="0x0CCC0015" />
+        <register type="NOA" address="0x00009888" value="0x0A8DA000" />
+        <register type="NOA" address="0x00009888" value="0x0C8DA000" />
+        <register type="NOA" address="0x00009888" value="0x0E8F4000" />
+        <register type="NOA" address="0x00009888" value="0x108F0015" />
+        <register type="NOA" address="0x00009888" value="0x16ACA000" />
+        <register type="NOA" address="0x00009888" value="0x18AC000A" />
+        <register type="NOA" address="0x00009888" value="0x06993000" />
+        <register type="NOA" address="0x00009888" value="0x0C9A28C1" />
+        <register type="NOA" address="0x00009888" value="0x009A0000" />
+        <register type="NOA" address="0x00009888" value="0x0A93F000" />
+        <register type="NOA" address="0x00009888" value="0x0C93F000" />
+        <register type="NOA" address="0x00009888" value="0x0A97A000" />
+        <register type="NOA" address="0x00009888" value="0x0C97A000" />
+        <register type="NOA" address="0x00009888" value="0x0A980977" />
+        <register type="NOA" address="0x00009888" value="0x08980000" />
+        <register type="NOA" address="0x00009888" value="0x04980000" />
+        <register type="NOA" address="0x00009888" value="0x06983000" />
+        <register type="NOA" address="0x00009888" value="0x119000FF" />
+        <register type="NOA" address="0x00009888" value="0x51900050" />
+        <register type="NOA" address="0x00009888" value="0x41900000" />
+        <register type="NOA" address="0x00009888" value="0x55900115" />
+        <register type="NOA" address="0x00009888" value="0x45900000" />
+        <register type="NOA" address="0x00009888" value="0x47900884" />
+        <register type="NOA" address="0x00009888" value="0x57900000" />
+        <register type="NOA" address="0x00009888" value="0x49900002" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x30800000" />
+        <register type="OA" address="0x00002770" value="0x00100030" />
+        <register type="OA" address="0x00002774" value="0x0000FFF9" />
+        <register type="OA" address="0x00002778" value="0x00000002" />
+        <register type="OA" address="0x0000277C" value="0x0000FFFC" />
+        <register type="OA" address="0x00002780" value="0x00000002" />
+        <register type="OA" address="0x00002784" value="0x0000FFF3" />
+        <register type="OA" address="0x00002788" value="0x00100180" />
+        <register type="OA" address="0x0000278C" value="0x0000FFCF" />
+        <register type="OA" address="0x00002790" value="0x00000002" />
+        <register type="OA" address="0x00002794" value="0x0000FFCF" />
+        <register type="OA" address="0x00002798" value="0x00000002" />
+        <register type="OA" address="0x0000279C" value="0x0000FF3F" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00008003" />
+    </register_config>
+  </set>
+
+  <set name="Gpu Rings Busyness"
+       mdapi_supported_apis="VK OGL OCL MEDIA IO BB"
+       underscore_name="gpu_busyness"
+       hw_config_guid="0c5058ff-fdf4-4e0d-81fb-c0310fb76525"
+       chipset="SKLGT3"
+       symbol_name="GpuBusyness"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="Vebox Ring Busy"
+             description="The percentage of time when vebox command streamer was busy."
+             data_type="float"
+             max_equation="100"
+             equation="C 4 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vebox_busy"
+             units="percent"
+             symbol_name="VeboxBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="System Frame Batch"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Render Ring Busy"
+             description="The percentage of time when render command streamer was busy."
+             data_type="float"
+             max_equation="100"
+             equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="render_busy"
+             units="percent"
+             symbol_name="RenderBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="System Frame Batch"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Vdbox0 Ring Busy"
+             description="The percentage of time when Vdbox0 command streamer was busy."
+             data_type="float"
+             max_equation="100"
+             equation="C 6 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vdbox0_busy"
+             units="percent"
+             symbol_name="Vdbox0Busy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="System Frame Batch"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Blitter Ring Busy"
+             description="The percentage of time when blitter command streamer was busy."
+             data_type="float"
+             max_equation="100"
+             equation="C 3 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="blitter_busy"
+             units="percent"
+             symbol_name="BlitterBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="System Frame Batch"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="AnyRingBusy"
+             description="The percentage of time when any command streamer was busy."
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="any_ring_busy"
+             units="percent"
+             symbol_name="AnyRingBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Vdbox1 Ring Busy"
+             description="The percentage of time when Vdbox1 command streamer was busy."
+             data_type="float"
+             max_equation="100"
+             equation="C 5 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vdbox1_busy"
+             units="percent"
+             symbol_name="Vdbox1Busy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="System Frame Batch"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x21D05800" />
+        <register type="NOA" address="0x00009888" value="0x13805800" />
+        <register type="NOA" address="0x00009888" value="0x05962C25" />
+        <register type="NOA" address="0x00009888" value="0x19950016" />
+        <register type="NOA" address="0x00009888" value="0x21C05800" />
+        <register type="NOA" address="0x00009888" value="0x09D000A5" />
+        <register type="NOA" address="0x00009888" value="0x11D00000" />
+        <register type="NOA" address="0x00009888" value="0x05D00000" />
+        <register type="NOA" address="0x00009888" value="0x09D54000" />
+        <register type="NOA" address="0x00009888" value="0x07800035" />
+        <register type="NOA" address="0x00009888" value="0x11800000" />
+        <register type="NOA" address="0x00009888" value="0x1D810400" />
+        <register type="NOA" address="0x00009888" value="0x21960000" />
+        <register type="NOA" address="0x00009888" value="0x0996C000" />
+        <register type="NOA" address="0x00009888" value="0x0B964000" />
+        <register type="NOA" address="0x00009888" value="0x19938000" />
+        <register type="NOA" address="0x00009888" value="0x1B930068" />
+        <register type="NOA" address="0x00009888" value="0x15948000" />
+        <register type="NOA" address="0x00009888" value="0x1B94000C" />
+        <register type="NOA" address="0x00009888" value="0x03957500" />
+        <register type="NOA" address="0x00009888" value="0x1D950000" />
+        <register type="NOA" address="0x00009888" value="0x17950000" />
+        <register type="NOA" address="0x00009888" value="0x07E54000" />
+        <register type="NOA" address="0x00009888" value="0x07928000" />
+        <register type="NOA" address="0x00009888" value="0x03988000" />
+        <register type="NOA" address="0x00009888" value="0x17908000" />
+        <register type="NOA" address="0x00009888" value="0x19904000" />
+        <register type="NOA" address="0x00009888" value="0x1B908000" />
+        <register type="NOA" address="0x00009888" value="0x1D908000" />
+        <register type="NOA" address="0x00009888" value="0x1F908000" />
+        <register type="NOA" address="0x00009888" value="0x09978000" />
+        <register type="NOA" address="0x00009888" value="0x0BC000A5" />
+        <register type="NOA" address="0x00009888" value="0x11C00000" />
+        <register type="NOA" address="0x00009888" value="0x05C00000" />
+        <register type="NOA" address="0x00009888" value="0x0BC54000" />
+        <register type="NOA" address="0x00009888" value="0x11900000" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x43900463" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+        <register type="NOA" address="0x00009888" value="0x45900040" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x10800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+        <register type="OA" address="0x00002770" value="0x0007C000" />
+        <register type="OA" address="0x00002774" value="0x000007FF" />
+    </register_config>
+  </set>
+
+  <set name="MDAPI testing set Gen9"
+       mdapi_supported_apis="VK OGL OCL IO BB"
+       underscore_name="test_oa"
+       hw_config_guid="2b985803-d3c9-4629-8a4f-634bfecba0e8"
+       chipset="SKLGT3"
+       symbol_name="TestOa"
+       >
+    <counter name="TestCounter7"
+             description="HW test counter 7. Factor: 0.666"
+             data_type="uint64"
+             equation="B 7 READ"
+             underscore_name="counter7"
+             units="events"
+             symbol_name="Counter7"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="TestCounter8"
+             description="HW test counter 8. Should be equal to 1."
+             data_type="uint64"
+             equation="C 7 READ"
+             underscore_name="counter8"
+             units="events"
+             symbol_name="Counter8"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="TestCounter4"
+             description="HW test counter 4. Factor: 0.333"
+             data_type="uint64"
+             equation="B 4 READ"
+             underscore_name="counter4"
+             units="events"
+             symbol_name="Counter4"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="TestCounter5"
+             description="HW test counter 5. Factor: 0.333"
+             data_type="uint64"
+             equation="B 5 READ"
+             underscore_name="counter5"
+             units="events"
+             symbol_name="Counter5"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="TestCounter6"
+             description="HW test counter 6. Factor: 0.166"
+             data_type="uint64"
+             equation="B 6 READ"
+             underscore_name="counter6"
+             units="events"
+             symbol_name="Counter6"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="TestCounter3"
+             description="HW test counter 3. Factor: 0.5"
+             data_type="uint64"
+             equation="B 3 READ"
+             underscore_name="counter3"
+             units="events"
+             symbol_name="Counter3"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="TestCounter0"
+             description="HW test counter 0. Factor: 0.0"
+             data_type="uint64"
+             equation="B 0 READ"
+             underscore_name="counter0"
+             units="events"
+             symbol_name="Counter0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="TestCounter1"
+             description="HW test counter 1. Factor: 1.0"
+             data_type="uint64"
+             equation="B 1 READ"
+             underscore_name="counter1"
+             units="events"
+             symbol_name="Counter1"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="TestCounter2"
+             description="HW test counter 2. Factor: 1.0"
+             data_type="uint64"
+             equation="B 2 READ"
+             underscore_name="counter2"
+             units="events"
+             symbol_name="Counter2"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x11810000" />
+        <register type="NOA" address="0x00009888" value="0x07810013" />
+        <register type="NOA" address="0x00009888" value="0x1F810000" />
+        <register type="NOA" address="0x00009888" value="0x1D810000" />
+        <register type="NOA" address="0x00009888" value="0x1B930040" />
+        <register type="NOA" address="0x00009888" value="0x07E54000" />
+        <register type="NOA" address="0x00009888" value="0x1F908000" />
+        <register type="NOA" address="0x00009888" value="0x11900000" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+        <register type="NOA" address="0x00009888" value="0x45900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002744" value="0x00800000" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002770" value="0x00000004" />
+        <register type="OA" address="0x00002774" value="0x00000000" />
+        <register type="OA" address="0x00002778" value="0x00000003" />
+        <register type="OA" address="0x0000277C" value="0x00000000" />
+        <register type="OA" address="0x00002780" value="0x00000007" />
+        <register type="OA" address="0x00002784" value="0x00000000" />
+        <register type="OA" address="0x00002788" value="0x00100002" />
+        <register type="OA" address="0x0000278C" value="0x0000FFF7" />
+        <register type="OA" address="0x00002790" value="0x00100002" />
+        <register type="OA" address="0x00002794" value="0x0000FFCF" />
+        <register type="OA" address="0x00002798" value="0x00100082" />
+        <register type="OA" address="0x0000279C" value="0x0000FFEF" />
+        <register type="OA" address="0x000027A0" value="0x001000C2" />
+        <register type="OA" address="0x000027A4" value="0x0000FFE7" />
+        <register type="OA" address="0x000027A8" value="0x00100001" />
+        <register type="OA" address="0x000027AC" value="0x0000FFE7" />
+    </register_config>
+  </set>
+
+  <set name="Metric set PMA Stall"
+       mdapi_supported_apis="VK OGL OGL4 OCL IO MEDIA"
+       underscore_name="pma__stall"
+       hw_config_guid="c889fd93-8dc7-4ba5-9451-de34a8b5ea3f"
+       chipset="SKLGT3"
+       symbol_name="PMA_Stall"
+       >
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="STC PMA stall"
+             description="Percentage of time when stencil cache line and an overlapping pixel are causing stalls"
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ B 1 READ FADD 2 FDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="stc_pma_stall"
+             units="percent"
+             symbol_name="StcPMAStall"
+             availability="$SliceMask 1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_group="GPU/Stencil Cache"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x122D3080" />
+        <register type="NOA" address="0x00009888" value="0x000D2000" />
+        <register type="NOA" address="0x00009888" value="0x060D8000" />
+        <register type="NOA" address="0x00009888" value="0x080DA000" />
+        <register type="NOA" address="0x00009888" value="0x0A0DA000" />
+        <register type="NOA" address="0x00009888" value="0x0C0F0800" />
+        <register type="NOA" address="0x00009888" value="0x0E0FAA00" />
+        <register type="NOA" address="0x00009888" value="0x100F0002" />
+        <register type="NOA" address="0x00009888" value="0x002D0025" />
+        <register type="NOA" address="0x00009888" value="0x062D1300" />
+        <register type="NOA" address="0x00009888" value="0x082D16A4" />
+        <register type="NOA" address="0x00009888" value="0x0A2D162E" />
+        <register type="NOA" address="0x00009888" value="0x102D0000" />
+        <register type="NOA" address="0x00009888" value="0x1190003F" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x41900000" />
+        <register type="NOA" address="0x00009888" value="0x55900000" />
+        <register type="NOA" address="0x00009888" value="0x45900000" />
+        <register type="NOA" address="0x00009888" value="0x47900000" />
+        <register type="NOA" address="0x00009888" value="0x57900000" />
+        <register type="NOA" address="0x00009888" value="0x49900000" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x30800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+        <register type="OA" address="0x00002770" value="0x00E00021" />
+        <register type="OA" address="0x00002774" value="0x0007FFF8" />
+        <register type="OA" address="0x00002778" value="0x07000101" />
+        <register type="OA" address="0x0000277C" value="0x0038FFC7" />
+    </register_config>
+  </set>
+
+</metrics>
diff --git a/lib/i915/perf-configs/oa-sklgt4.xml b/lib/i915/perf-configs/oa-sklgt4.xml
new file mode 100644
index 00000000..94f6a633
--- /dev/null
+++ b/lib/i915/perf-configs/oa-sklgt4.xml
@@ -0,0 +1,10956 @@
+<?xml version="1.0"?>
+<metrics version="1581935519" merge_md5="">
+  <set name="Render Metrics Basic Gen9"
+       mdapi_supported_apis="VK VK OGL OCL IO BB"
+       underscore_name="render_basic"
+       hw_config_guid="95322a71-bb05-4437-bc27-f7dd7b27d136"
+       chipset="SKLGT4"
+       symbol_name="RenderBasic"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Misses"
+             description="The total number of L3 misses."
+             data_type="uint64"
+             equation="C 4 READ"
+             underscore_name="l3_misses"
+             units="messages"
+             symbol_name="L3Misses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/TAG"
+             />
+    <counter name="GTI L3 Throughput"
+             description="The total number of GPU memory bytes transferred between L3 caches and GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="$L3Misses 64 UMUL"
+             underscore_name="gti_l3_throughput"
+             units="bytes"
+             symbol_name="GtiL3Throughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Cache Misses"
+             description="The total number of sampler cache misses in all LODs in all sampler units."
+             data_type="uint64"
+             equation="B 4 READ B 5 READ UADD B 3 READ UADD 8 UMUL"
+             underscore_name="sampler_l1_misses"
+             units="messages"
+             symbol_name="SamplerL1Misses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="L3 Sampler Throughput"
+             description="The total number of GPU memory bytes transferred between samplers and L3 caches."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="$SamplerL1Misses 64 UMUL"
+             underscore_name="l3_sampler_throughput"
+             units="bytes"
+             symbol_name="L3SamplerThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Sampler"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on the both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Sampler 0 Busy"
+             description="The percentage of time in which Sampler 0 has been processing EU requests."
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler0_busy"
+             units="percent"
+             symbol_name="Sampler0Busy"
+             availability="$SubsliceMask 0x09 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_group="Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Sampler 1 Busy"
+             description="The percentage of time in which Sampler 1 has been processing EU requests."
+             data_type="float"
+             max_equation="100"
+             equation="B 1 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler1_busy"
+             units="percent"
+             symbol_name="Sampler1Busy"
+             availability="$SubsliceMask 0x12 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_group="Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Samplers Busy"
+             description="The percentage of time in which samplers have been processing EU requests."
+             data_type="float"
+             max_equation="100"
+             equation="$Sampler0Busy $Sampler1Busy FMAX"
+             underscore_name="samplers_busy"
+             units="percent"
+             symbol_name="SamplersBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="Sampler"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="GTI Fixed Pipe Throughput"
+             description="The total number of GPU memory bytes transferred between 3D Pipeline (Command Dispatch, Input Assembly and Stream Output) and GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL"
+             equation="B 6 READ B 7 READ UADD 64 UMUL"
+             underscore_name="gti_vf_throughput"
+             units="bytes"
+             symbol_name="GtiVfThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK VK OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="GTI/3D Pipe"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler 0 Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which Sampler 0 has been slowing down the pipe when processing EU requests."
+             data_type="float"
+             high_watermark="15"
+             equation="B 2 READ 100 UMUL $GpuCoreClocks FDIV"
+             max_equation="100"
+             underscore_name="sampler0_bottleneck"
+             units="percent"
+             symbol_name="Sampler0Bottleneck"
+             availability="$SubsliceMask 0x09 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="L3 Lookup Accesses w/o IC"
+             description="The total number of L3 cache lookup accesses w/o IC."
+             data_type="uint64"
+             equation="$SamplerL1Misses $ShaderMemoryAccesses UADD"
+             underscore_name="l3_lookups"
+             units="messages"
+             symbol_name="L3Lookups"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/TAG"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GTI Read Throughput"
+             description="The total number of GPU memory bytes read from GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL"
+             equation="C 6 READ 64 UMUL"
+             underscore_name="gti_read_throughput"
+             units="bytes"
+             symbol_name="GtiReadThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GTI Depth Throughput"
+             description="The total number of GPU memory bytes transferred between depth caches and GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="C 0 READ C 1 READ UADD 64 UMUL"
+             underscore_name="gti_depth_throughput"
+             units="bytes"
+             symbol_name="GtiDepthThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK VK OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="GTI/Depth Cache"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Samplers Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which samplers have been slowing down the pipe when processing EU requests."
+             data_type="float"
+             high_watermark="15"
+             equation="$Sampler0Bottleneck"
+             max_equation="100"
+             underscore_name="sampler_bottleneck"
+             units="percent"
+             symbol_name="SamplerBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Indicate System Frame Batch Draw"
+             mdapi_group="Sampler"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="GTI HDC TLB Lookup Throughput"
+             description="The total number of GPU memory bytes transferred between GTI and HDC, when HDC is doing TLB lookups."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="C 5 READ 64 UMUL"
+             underscore_name="gti_hdc_lookups_throughput"
+             units="bytes"
+             symbol_name="GtiHdcLookupsThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GTI RCC Throughput"
+             description="The total number of GPU memory bytes transferred between render color caches and GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="C 2 READ C 3 READ UADD 64 UMUL"
+             underscore_name="gti_rcc_throughput"
+             units="bytes"
+             symbol_name="GtiRccThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK VK OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="GTI/Color Cache"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="GTI Write Throughput"
+             description="The total number of GPU memory bytes written to GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 32 UMUL"
+             equation="C 7 READ 64 UMUL"
+             underscore_name="gti_write_throughput"
+             units="bytes"
+             symbol_name="GtiWriteThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x166C01E0" />
+        <register type="NOA" address="0x00009888" value="0x12170280" />
+        <register type="NOA" address="0x00009888" value="0x12370280" />
+        <register type="NOA" address="0x00009888" value="0x16EC01E0" />
+        <register type="NOA" address="0x00009888" value="0x176C01E0" />
+        <register type="NOA" address="0x00009888" value="0x11930317" />
+        <register type="NOA" address="0x00009888" value="0x159303DF" />
+        <register type="NOA" address="0x00009888" value="0x3F900003" />
+        <register type="NOA" address="0x00009888" value="0x1A4E03B0" />
+        <register type="NOA" address="0x00009888" value="0x0A6C0053" />
+        <register type="NOA" address="0x00009888" value="0x106C0000" />
+        <register type="NOA" address="0x00009888" value="0x1C6C0000" />
+        <register type="NOA" address="0x00009888" value="0x0A1B4000" />
+        <register type="NOA" address="0x00009888" value="0x1C1C0001" />
+        <register type="NOA" address="0x00009888" value="0x002F1000" />
+        <register type="NOA" address="0x00009888" value="0x042F1000" />
+        <register type="NOA" address="0x00009888" value="0x004C4000" />
+        <register type="NOA" address="0x00009888" value="0x0A4CA400" />
+        <register type="NOA" address="0x00009888" value="0x0C4C0002" />
+        <register type="NOA" address="0x00009888" value="0x000D2000" />
+        <register type="NOA" address="0x00009888" value="0x060D8000" />
+        <register type="NOA" address="0x00009888" value="0x080DA000" />
+        <register type="NOA" address="0x00009888" value="0x0A0DA000" />
+        <register type="NOA" address="0x00009888" value="0x0C0F0400" />
+        <register type="NOA" address="0x00009888" value="0x0E0F5600" />
+        <register type="NOA" address="0x00009888" value="0x100F0001" />
+        <register type="NOA" address="0x00009888" value="0x002C8000" />
+        <register type="NOA" address="0x00009888" value="0x162CAA00" />
+        <register type="NOA" address="0x00009888" value="0x062D8000" />
+        <register type="NOA" address="0x00009888" value="0x00133000" />
+        <register type="NOA" address="0x00009888" value="0x08133000" />
+        <register type="NOA" address="0x00009888" value="0x00170020" />
+        <register type="NOA" address="0x00009888" value="0x08170021" />
+        <register type="NOA" address="0x00009888" value="0x10170000" />
+        <register type="NOA" address="0x00009888" value="0x0633C000" />
+        <register type="NOA" address="0x00009888" value="0x06370800" />
+        <register type="NOA" address="0x00009888" value="0x10370000" />
+        <register type="NOA" address="0x00009888" value="0x1ACE0230" />
+        <register type="NOA" address="0x00009888" value="0x0AEC5300" />
+        <register type="NOA" address="0x00009888" value="0x10EC0000" />
+        <register type="NOA" address="0x00009888" value="0x1CEC0000" />
+        <register type="NOA" address="0x00009888" value="0x0A9B8000" />
+        <register type="NOA" address="0x00009888" value="0x1C9C0002" />
+        <register type="NOA" address="0x00009888" value="0x0ACC2000" />
+        <register type="NOA" address="0x00009888" value="0x0CCC0002" />
+        <register type="NOA" address="0x00009888" value="0x088D8000" />
+        <register type="NOA" address="0x00009888" value="0x0A8D8000" />
+        <register type="NOA" address="0x00009888" value="0x0E8F1000" />
+        <register type="NOA" address="0x00009888" value="0x108F0001" />
+        <register type="NOA" address="0x00009888" value="0x16AC8800" />
+        <register type="NOA" address="0x00009888" value="0x1B4E0020" />
+        <register type="NOA" address="0x00009888" value="0x096C5300" />
+        <register type="NOA" address="0x00009888" value="0x116C0000" />
+        <register type="NOA" address="0x00009888" value="0x1D6C0000" />
+        <register type="NOA" address="0x00009888" value="0x091B8000" />
+        <register type="NOA" address="0x00009888" value="0x1B1C8000" />
+        <register type="NOA" address="0x00009888" value="0x0B4C2000" />
+        <register type="NOA" address="0x00009888" value="0x090D8000" />
+        <register type="NOA" address="0x00009888" value="0x0F0F1000" />
+        <register type="NOA" address="0x00009888" value="0x172C0800" />
+        <register type="NOA" address="0x00009888" value="0x0D933031" />
+        <register type="NOA" address="0x00009888" value="0x0F933E3F" />
+        <register type="NOA" address="0x00009888" value="0x01933D00" />
+        <register type="NOA" address="0x00009888" value="0x0393073C" />
+        <register type="NOA" address="0x00009888" value="0x0593000E" />
+        <register type="NOA" address="0x00009888" value="0x1D930000" />
+        <register type="NOA" address="0x00009888" value="0x19930000" />
+        <register type="NOA" address="0x00009888" value="0x1B930000" />
+        <register type="NOA" address="0x00009888" value="0x1D900157" />
+        <register type="NOA" address="0x00009888" value="0x1F900158" />
+        <register type="NOA" address="0x00009888" value="0x35900000" />
+        <register type="NOA" address="0x00009888" value="0x2B908000" />
+        <register type="NOA" address="0x00009888" value="0x2D908000" />
+        <register type="NOA" address="0x00009888" value="0x2F908000" />
+        <register type="NOA" address="0x00009888" value="0x31908000" />
+        <register type="NOA" address="0x00009888" value="0x15908000" />
+        <register type="NOA" address="0x00009888" value="0x17908000" />
+        <register type="NOA" address="0x00009888" value="0x19908000" />
+        <register type="NOA" address="0x00009888" value="0x1B908000" />
+        <register type="NOA" address="0x00009888" value="0x1190003F" />
+        <register type="NOA" address="0x00009888" value="0x5190FF30" />
+        <register type="NOA" address="0x00009888" value="0x41900060" />
+        <register type="NOA" address="0x00009888" value="0x55903033" />
+        <register type="NOA" address="0x00009888" value="0x45901421" />
+        <register type="NOA" address="0x00009888" value="0x47900803" />
+        <register type="NOA" address="0x00009888" value="0x5790FFF1" />
+        <register type="NOA" address="0x00009888" value="0x49900001" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+        <register type="NOA" address="0x00009888" value="0x4B900000" />
+        <register type="NOA" address="0x00009888" value="0x5990000F" />
+        <register type="NOA" address="0x00009888" value="0x43900000" />
+        <register type="NOA" address="0x00009888" value="0x5390FFFF" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x00800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+        <register type="OA" address="0x00002740" value="0x00000000" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E758" value="0x00015014" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+        <register type="FLEX" address="0x0000E65C" value="0x00222222" />
+    </register_config>
+  </set>
+
+  <set name="Compute Metrics Basic Gen9"
+       mdapi_supported_apis="VK VK OGL4 OCL IO BB"
+       underscore_name="compute_basic"
+       hw_config_guid="7277228f-e7f3-4743-945a-6a2049d11377"
+       chipset="SKLGT4"
+       symbol_name="ComputeBasic"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Untyped Bytes Read"
+             description="The total number of untyped memory bytes read via Data Port."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="B 6 READ B 7 READ C 0 READ UADD UADD $EuSlicesTotalCount 64 UMUL UMUL"
+             underscore_name="untyped_bytes_read"
+             units="bytes"
+             symbol_name="UntypedBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Typed Bytes Written"
+             description="The total number of typed memory bytes written via Data Port."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="B 3 READ B 4 READ B 5 READ UADD UADD $EuSlicesTotalCount 64 UMUL UMUL"
+             underscore_name="typed_bytes_written"
+             units="bytes"
+             symbol_name="TypedBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="fpu0_active"
+             units="percent"
+             symbol_name="Fpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="fpu1_active"
+             units="percent"
+             symbol_name="Fpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK VK OGL IO OCL BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU AVG IPC Rate"
+             description="The average rate of IPC calculated for 2 FPU pipelines."
+             data_type="float"
+             max_equation="2"
+             equation="A 9 READ  A 10 READ  A 11 READ UADD  A 9 READ USUB FDIV 1 FADD"
+             underscore_name="eu_avg_ipc_rate"
+             units="number"
+             symbol_name="EuAvgIpcRate"
+             semantic_type="ratio"
+             mdapi_supported_apis="VK VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier4 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL IO OCL BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL IO OCL BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis="VK VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texel lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GTI Read Throughput"
+             description="The total number of GPU memory bytes read from GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="C 4 READ 64 UMUL"
+             underscore_name="gti_read_throughput"
+             units="bytes"
+             symbol_name="GtiReadThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Untyped Writes"
+             description="The total number of untyped memory bytes written via Data Port."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="C 1 READ C 2 READ C 3 READ UADD UADD $EuSlicesTotalCount 64 UMUL UMUL"
+             underscore_name="untyped_bytes_written"
+             units="bytes"
+             symbol_name="UntypedBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis="VK VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL IO OCL BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="Typed Bytes Read"
+             description="The total number of typed memory bytes read via Data Port."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="B 0 READ B 1 READ B 2 READ UADD UADD $EuSlicesTotalCount 64 UMUL UMUL"
+             underscore_name="typed_bytes_read"
+             units="bytes"
+             symbol_name="TypedBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="EU Thread Occupancy"
+             description="The percentage of time in which hardware threads occupied EUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 13 READ 8 UMUL $EuCoresTotalCount UDIV $EuThreadsCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_thread_occupancy"
+             units="percent"
+             symbol_name="EuThreadOccupancy"
+             semantic_type="duration"
+             mdapi_supported_apis="VK VK OGL IO OCL BB"
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis="VK VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL IO OCL BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL IO OCL BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="GTI Write Throughput"
+             description="The total number of GPU memory bytes written to GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 32 UMUL"
+             equation="C 5 READ 64 UMUL"
+             underscore_name="gti_write_throughput"
+             units="bytes"
+             symbol_name="GtiWriteThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL IO OCL BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL IO OCL BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <counter name="EU Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_send_active"
+             units="percent"
+             symbol_name="EuSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK VK OGL IO OCL BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x104F00E0" />
+        <register type="NOA" address="0x00009888" value="0x124F1C00" />
+        <register type="NOA" address="0x00009888" value="0x106C00E0" />
+        <register type="NOA" address="0x00009888" value="0x37906800" />
+        <register type="NOA" address="0x00009888" value="0x3F900003" />
+        <register type="NOA" address="0x00009888" value="0x004E8000" />
+        <register type="NOA" address="0x00009888" value="0x1A4E0820" />
+        <register type="NOA" address="0x00009888" value="0x1C4E0002" />
+        <register type="NOA" address="0x00009888" value="0x064F0900" />
+        <register type="NOA" address="0x00009888" value="0x084F0032" />
+        <register type="NOA" address="0x00009888" value="0x0A4F1891" />
+        <register type="NOA" address="0x00009888" value="0x0C4F0E00" />
+        <register type="NOA" address="0x00009888" value="0x0E4F003C" />
+        <register type="NOA" address="0x00009888" value="0x004F0D80" />
+        <register type="NOA" address="0x00009888" value="0x024F003B" />
+        <register type="NOA" address="0x00009888" value="0x006C0002" />
+        <register type="NOA" address="0x00009888" value="0x086C0100" />
+        <register type="NOA" address="0x00009888" value="0x0C6C000C" />
+        <register type="NOA" address="0x00009888" value="0x0E6C0B00" />
+        <register type="NOA" address="0x00009888" value="0x186C0000" />
+        <register type="NOA" address="0x00009888" value="0x1C6C0000" />
+        <register type="NOA" address="0x00009888" value="0x1E6C0000" />
+        <register type="NOA" address="0x00009888" value="0x001B4000" />
+        <register type="NOA" address="0x00009888" value="0x081B8000" />
+        <register type="NOA" address="0x00009888" value="0x0C1B4000" />
+        <register type="NOA" address="0x00009888" value="0x0E1B8000" />
+        <register type="NOA" address="0x00009888" value="0x101C8000" />
+        <register type="NOA" address="0x00009888" value="0x1A1C8000" />
+        <register type="NOA" address="0x00009888" value="0x1C1C0024" />
+        <register type="NOA" address="0x00009888" value="0x065B8000" />
+        <register type="NOA" address="0x00009888" value="0x085B4000" />
+        <register type="NOA" address="0x00009888" value="0x0A5BC000" />
+        <register type="NOA" address="0x00009888" value="0x0C5B8000" />
+        <register type="NOA" address="0x00009888" value="0x0E5B4000" />
+        <register type="NOA" address="0x00009888" value="0x005B8000" />
+        <register type="NOA" address="0x00009888" value="0x025B4000" />
+        <register type="NOA" address="0x00009888" value="0x1A5C6000" />
+        <register type="NOA" address="0x00009888" value="0x1C5C001B" />
+        <register type="NOA" address="0x00009888" value="0x125C8000" />
+        <register type="NOA" address="0x00009888" value="0x145C8000" />
+        <register type="NOA" address="0x00009888" value="0x004C8000" />
+        <register type="NOA" address="0x00009888" value="0x0A4C2000" />
+        <register type="NOA" address="0x00009888" value="0x0C4C0208" />
+        <register type="NOA" address="0x00009888" value="0x000DA000" />
+        <register type="NOA" address="0x00009888" value="0x060D8000" />
+        <register type="NOA" address="0x00009888" value="0x080DA000" />
+        <register type="NOA" address="0x00009888" value="0x0A0DA000" />
+        <register type="NOA" address="0x00009888" value="0x0C0DA000" />
+        <register type="NOA" address="0x00009888" value="0x0E0DA000" />
+        <register type="NOA" address="0x00009888" value="0x020D2000" />
+        <register type="NOA" address="0x00009888" value="0x0C0F5400" />
+        <register type="NOA" address="0x00009888" value="0x0E0F5500" />
+        <register type="NOA" address="0x00009888" value="0x100F0155" />
+        <register type="NOA" address="0x00009888" value="0x002C8000" />
+        <register type="NOA" address="0x00009888" value="0x0E2CC000" />
+        <register type="NOA" address="0x00009888" value="0x162CFB00" />
+        <register type="NOA" address="0x00009888" value="0x182C00BE" />
+        <register type="NOA" address="0x00009888" value="0x022CC000" />
+        <register type="NOA" address="0x00009888" value="0x042CC000" />
+        <register type="NOA" address="0x00009888" value="0x19900157" />
+        <register type="NOA" address="0x00009888" value="0x1B900158" />
+        <register type="NOA" address="0x00009888" value="0x1D900105" />
+        <register type="NOA" address="0x00009888" value="0x1F900103" />
+        <register type="NOA" address="0x00009888" value="0x35900000" />
+        <register type="NOA" address="0x00009888" value="0x11900FFF" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x41900800" />
+        <register type="NOA" address="0x00009888" value="0x55900000" />
+        <register type="NOA" address="0x00009888" value="0x45900821" />
+        <register type="NOA" address="0x00009888" value="0x47900802" />
+        <register type="NOA" address="0x00009888" value="0x57900000" />
+        <register type="NOA" address="0x00009888" value="0x49900802" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+        <register type="NOA" address="0x00009888" value="0x4B900002" />
+        <register type="NOA" address="0x00009888" value="0x59900000" />
+        <register type="NOA" address="0x00009888" value="0x43900422" />
+        <register type="NOA" address="0x00009888" value="0x53905555" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x00800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+        <register type="OA" address="0x00002740" value="0x00000000" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00000003" />
+        <register type="FLEX" address="0x0000E658" value="0x00002001" />
+        <register type="FLEX" address="0x0000E758" value="0x00778008" />
+        <register type="FLEX" address="0x0000E45C" value="0x00088078" />
+        <register type="FLEX" address="0x0000E55C" value="0x00808708" />
+        <register type="FLEX" address="0x0000E65C" value="0x00A08908" />
+    </register_config>
+  </set>
+
+  <set name="Render Metrics for 3D Pipeline Profile Gen9"
+       mdapi_supported_apis="VK VK OGL OCL IO BB"
+       underscore_name="render_pipe_profile"
+       hw_config_guid="463c668c-3f60-49b6-8f85-d995b635b3b2"
+       chipset="SKLGT4"
+       symbol_name="RenderPipeProfile"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Bottleneck"
+             low_watermark="10"
+             description="The percentage of time in which vertex shader pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="30"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_bottleneck"
+             units="percent"
+             symbol_name="VsBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="VK VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Hi-Depth Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which early hierarchical depth test pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="15"
+             equation="C 6 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="hi_depth_bottleneck"
+             units="percent"
+             symbol_name="HiDepthBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="VK VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which geometry shader pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="15"
+             equation="B 3 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gs_bottleneck"
+             units="percent"
+             symbol_name="GsBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="VK VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Geometry Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="BC Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which barycentric coordinates calculation pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="15"
+             equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="bc_bottleneck"
+             units="percent"
+             symbol_name="BcBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="VK VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Rasterizer/Barycentric Calc"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="HS Stall"
+             description="The percentage of time in which hull shader pipeline stage was stalled."
+             data_type="float"
+             equation="C 1 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="hs_stall"
+             units="percent"
+             symbol_name="HsStall"
+             semantic_type="duration"
+             mdapi_supported_apis="VK VK OGL4 IO BB"
+             mdapi_usage_flags="Tier4 Correlate Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Hull Shader"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texel lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="VF Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which vertex fetch pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="15"
+             equation="C 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vf_bottleneck"
+             units="percent"
+             symbol_name="VfBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="VK VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Input Assembler"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Strip-Fans Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which strip-fans pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="10"
+             equation="B 6 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sf_bottleneck"
+             units="percent"
+             symbol_name="SfBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="VK VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Rasterizer/Strip-Fans"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SF Stall"
+             description="The percentage of time in which strip-fans pipeline stage was stalled."
+             data_type="float"
+             equation="C 5 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sf_stall"
+             units="percent"
+             symbol_name="SfStall"
+             semantic_type="duration"
+             mdapi_supported_apis="VK VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Correlate Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Strip-Fans"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="HS Bottleneck"
+             low_watermark="3"
+             description="The percentage of time in which hull shader pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="9"
+             equation="B 1 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="hs_bottleneck"
+             units="percent"
+             symbol_name="HsBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="VK VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Hull Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="CL Stall"
+             description="The percentage of time in which clipper pipeline stage was stalled."
+             data_type="float"
+             equation="C 4 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="cl_stall"
+             units="percent"
+             symbol_name="ClStall"
+             semantic_type="duration"
+             mdapi_supported_apis="VK VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Correlate Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Clipper"
+             />
+    <counter name="SO Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which stream output pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="15"
+             equation="B 4 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="so_bottleneck"
+             units="percent"
+             symbol_name="SoBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="VK VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Stream Output"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="DS Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which domain shader pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="15"
+             equation="B 2 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ds_bottleneck"
+             units="percent"
+             symbol_name="DsBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="VK VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Domain Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Clipper Bottleneck"
+             low_watermark="10"
+             description="The percentage of time in which clipper pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="30"
+             equation="B 5 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="cl_bottleneck"
+             units="percent"
+             symbol_name="ClBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="VK VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Clipper"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Stall"
+             description="The percentage of time in which domain shader pipeline stage was stalled."
+             data_type="float"
+             equation="C 2 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ds_stall"
+             units="percent"
+             symbol_name="DsStall"
+             semantic_type="duration"
+             mdapi_supported_apis="VK VK OGL4 IO BB"
+             mdapi_usage_flags="Tier4 Correlate Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Domain Shader"
+             />
+    <counter name="Early Depth Bottleneck"
+             low_watermark="10"
+             description="The percentage of time in which early depth test pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="30"
+             equation="B 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="early_depth_bottleneck"
+             units="percent"
+             symbol_name="EarlyDepthBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="VK VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="SO Stall"
+             description="The percentage of time in which stream-output pipeline stage was stalled."
+             data_type="float"
+             equation="C 3 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="so_stall"
+             units="percent"
+             symbol_name="SoStall"
+             semantic_type="duration"
+             mdapi_supported_apis="VK VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Correlate Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Stream Output"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x0C0E001F" />
+        <register type="NOA" address="0x00009888" value="0x0A0F0000" />
+        <register type="NOA" address="0x00009888" value="0x10116800" />
+        <register type="NOA" address="0x00009888" value="0x178A03E0" />
+        <register type="NOA" address="0x00009888" value="0x11824C00" />
+        <register type="NOA" address="0x00009888" value="0x11830020" />
+        <register type="NOA" address="0x00009888" value="0x13840020" />
+        <register type="NOA" address="0x00009888" value="0x11850019" />
+        <register type="NOA" address="0x00009888" value="0x11860007" />
+        <register type="NOA" address="0x00009888" value="0x01870C40" />
+        <register type="NOA" address="0x00009888" value="0x17880000" />
+        <register type="NOA" address="0x00009888" value="0x022F4000" />
+        <register type="NOA" address="0x00009888" value="0x0A4C0040" />
+        <register type="NOA" address="0x00009888" value="0x0C0D8000" />
+        <register type="NOA" address="0x00009888" value="0x040D4000" />
+        <register type="NOA" address="0x00009888" value="0x060D2000" />
+        <register type="NOA" address="0x00009888" value="0x020E5400" />
+        <register type="NOA" address="0x00009888" value="0x000E0000" />
+        <register type="NOA" address="0x00009888" value="0x080F0040" />
+        <register type="NOA" address="0x00009888" value="0x000F0000" />
+        <register type="NOA" address="0x00009888" value="0x100F0000" />
+        <register type="NOA" address="0x00009888" value="0x0E0F0040" />
+        <register type="NOA" address="0x00009888" value="0x0C2C8000" />
+        <register type="NOA" address="0x00009888" value="0x06104000" />
+        <register type="NOA" address="0x00009888" value="0x06110012" />
+        <register type="NOA" address="0x00009888" value="0x06131000" />
+        <register type="NOA" address="0x00009888" value="0x01898000" />
+        <register type="NOA" address="0x00009888" value="0x0D890100" />
+        <register type="NOA" address="0x00009888" value="0x03898000" />
+        <register type="NOA" address="0x00009888" value="0x09808000" />
+        <register type="NOA" address="0x00009888" value="0x0B808000" />
+        <register type="NOA" address="0x00009888" value="0x0380C000" />
+        <register type="NOA" address="0x00009888" value="0x0F8A0075" />
+        <register type="NOA" address="0x00009888" value="0x1D8A0000" />
+        <register type="NOA" address="0x00009888" value="0x118A8000" />
+        <register type="NOA" address="0x00009888" value="0x1B8A4000" />
+        <register type="NOA" address="0x00009888" value="0x138A8000" />
+        <register type="NOA" address="0x00009888" value="0x1D81A000" />
+        <register type="NOA" address="0x00009888" value="0x15818000" />
+        <register type="NOA" address="0x00009888" value="0x17818000" />
+        <register type="NOA" address="0x00009888" value="0x0B820030" />
+        <register type="NOA" address="0x00009888" value="0x07828000" />
+        <register type="NOA" address="0x00009888" value="0x0D824000" />
+        <register type="NOA" address="0x00009888" value="0x0F828000" />
+        <register type="NOA" address="0x00009888" value="0x05824000" />
+        <register type="NOA" address="0x00009888" value="0x0D830003" />
+        <register type="NOA" address="0x00009888" value="0x0583000C" />
+        <register type="NOA" address="0x00009888" value="0x09830000" />
+        <register type="NOA" address="0x00009888" value="0x03838000" />
+        <register type="NOA" address="0x00009888" value="0x07838000" />
+        <register type="NOA" address="0x00009888" value="0x0B840980" />
+        <register type="NOA" address="0x00009888" value="0x03844D80" />
+        <register type="NOA" address="0x00009888" value="0x11840000" />
+        <register type="NOA" address="0x00009888" value="0x09848000" />
+        <register type="NOA" address="0x00009888" value="0x09850080" />
+        <register type="NOA" address="0x00009888" value="0x03850003" />
+        <register type="NOA" address="0x00009888" value="0x01850000" />
+        <register type="NOA" address="0x00009888" value="0x07860000" />
+        <register type="NOA" address="0x00009888" value="0x0F860400" />
+        <register type="NOA" address="0x00009888" value="0x09870032" />
+        <register type="NOA" address="0x00009888" value="0x01888052" />
+        <register type="NOA" address="0x00009888" value="0x11880000" />
+        <register type="NOA" address="0x00009888" value="0x09884000" />
+        <register type="NOA" address="0x00009888" value="0x1B931001" />
+        <register type="NOA" address="0x00009888" value="0x1D930001" />
+        <register type="NOA" address="0x00009888" value="0x19934000" />
+        <register type="NOA" address="0x00009888" value="0x1B958000" />
+        <register type="NOA" address="0x00009888" value="0x1D950094" />
+        <register type="NOA" address="0x00009888" value="0x19958000" />
+        <register type="NOA" address="0x00009888" value="0x09E58000" />
+        <register type="NOA" address="0x00009888" value="0x0BE58000" />
+        <register type="NOA" address="0x00009888" value="0x03E5C000" />
+        <register type="NOA" address="0x00009888" value="0x0592C000" />
+        <register type="NOA" address="0x00009888" value="0x0B928000" />
+        <register type="NOA" address="0x00009888" value="0x0D924000" />
+        <register type="NOA" address="0x00009888" value="0x0F924000" />
+        <register type="NOA" address="0x00009888" value="0x11928000" />
+        <register type="NOA" address="0x00009888" value="0x1392C000" />
+        <register type="NOA" address="0x00009888" value="0x09924000" />
+        <register type="NOA" address="0x00009888" value="0x01985000" />
+        <register type="NOA" address="0x00009888" value="0x07988000" />
+        <register type="NOA" address="0x00009888" value="0x09981000" />
+        <register type="NOA" address="0x00009888" value="0x0B982000" />
+        <register type="NOA" address="0x00009888" value="0x0D982000" />
+        <register type="NOA" address="0x00009888" value="0x0F989000" />
+        <register type="NOA" address="0x00009888" value="0x05982000" />
+        <register type="NOA" address="0x00009888" value="0x13904000" />
+        <register type="NOA" address="0x00009888" value="0x21904000" />
+        <register type="NOA" address="0x00009888" value="0x23904000" />
+        <register type="NOA" address="0x00009888" value="0x25908000" />
+        <register type="NOA" address="0x00009888" value="0x27904000" />
+        <register type="NOA" address="0x00009888" value="0x29908000" />
+        <register type="NOA" address="0x00009888" value="0x2B904000" />
+        <register type="NOA" address="0x00009888" value="0x2F904000" />
+        <register type="NOA" address="0x00009888" value="0x31904000" />
+        <register type="NOA" address="0x00009888" value="0x15904000" />
+        <register type="NOA" address="0x00009888" value="0x17908000" />
+        <register type="NOA" address="0x00009888" value="0x19908000" />
+        <register type="NOA" address="0x00009888" value="0x1B904000" />
+        <register type="NOA" address="0x00009888" value="0x1190C080" />
+        <register type="NOA" address="0x00009888" value="0x51901110" />
+        <register type="NOA" address="0x00009888" value="0x41900440" />
+        <register type="NOA" address="0x00009888" value="0x55901111" />
+        <register type="NOA" address="0x00009888" value="0x45900400" />
+        <register type="NOA" address="0x00009888" value="0x47900C21" />
+        <register type="NOA" address="0x00009888" value="0x57901411" />
+        <register type="NOA" address="0x00009888" value="0x49900042" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+        <register type="NOA" address="0x00009888" value="0x4B900024" />
+        <register type="NOA" address="0x00009888" value="0x59900001" />
+        <register type="NOA" address="0x00009888" value="0x43900841" />
+        <register type="NOA" address="0x00009888" value="0x53900411" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002724" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002770" value="0x0007FFEA" />
+        <register type="OA" address="0x00002774" value="0x00007FFC" />
+        <register type="OA" address="0x00002778" value="0x0007AFFA" />
+        <register type="OA" address="0x0000277C" value="0x0000F5FD" />
+        <register type="OA" address="0x00002780" value="0x00079FFA" />
+        <register type="OA" address="0x00002784" value="0x0000F3FB" />
+        <register type="OA" address="0x00002788" value="0x0007BF7A" />
+        <register type="OA" address="0x0000278C" value="0x0000F7E7" />
+        <register type="OA" address="0x00002790" value="0x0007FEFA" />
+        <register type="OA" address="0x00002794" value="0x0000F7CF" />
+        <register type="OA" address="0x00002798" value="0x00077FFA" />
+        <register type="OA" address="0x0000279C" value="0x0000EFDF" />
+        <register type="OA" address="0x000027A0" value="0x0006FFFA" />
+        <register type="OA" address="0x000027A4" value="0x0000CFBF" />
+        <register type="OA" address="0x000027A8" value="0x0003FFFA" />
+        <register type="OA" address="0x000027AC" value="0x00005F7F" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00015014" />
+        <register type="FLEX" address="0x0000E658" value="0x00025024" />
+        <register type="FLEX" address="0x0000E758" value="0x00035034" />
+        <register type="FLEX" address="0x0000E45C" value="0x00045044" />
+        <register type="FLEX" address="0x0000E55C" value="0x00055054" />
+        <register type="FLEX" address="0x0000E65C" value="0x00065064" />
+    </register_config>
+  </set>
+
+  <set name="Memory Reads Distribution Gen9"
+       mdapi_supported_apis="VK VK OGL OCL IO BB"
+       underscore_name="memory_reads"
+       hw_config_guid="3ae6e74c-72c3-4040-9bd0-7961430b8cc8"
+       chipset="SKLGT4"
+       symbol_name="MemoryReads"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GtiL3Bank0Reads"
+             description="The total number of GTI memory reads from L3 Bank 0 (L3 Cache misses)."
+             data_type="uint64"
+             equation="C 4 READ"
+             underscore_name="gti_l3_bank0_reads"
+             units="messages"
+             symbol_name="GtiL3Bank0Reads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/L3"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="GtiRingAccesses"
+             description="The total number of all accesses from GTI to the ring."
+             data_type="uint64"
+             equation="C 3 READ 2 UMUL"
+             underscore_name="gti_ring_accesses"
+             units="messages"
+             symbol_name="GtiRingAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="GtiL3Bank3Reads"
+             description="The total number of GTI memory reads from L3 Bank 3 (L3 Cache misses)."
+             data_type="uint64"
+             equation="C 7 READ"
+             underscore_name="gti_l3_bank3_reads"
+             units="messages"
+             symbol_name="GtiL3Bank3Reads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="GTI/L3"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="GtiRsMemoryReads"
+             description="The total number of GTI memory reads from Resource Streamer."
+             data_type="uint64"
+             equation="B 2 READ"
+             underscore_name="gti_rs_memory_reads"
+             units="messages"
+             symbol_name="GtiRsMemoryReads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/3D Pipe/Resource Streamer"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GtiHizMemoryReads"
+             description="The total number of GTI memory reads from Hierarchical Depth Cache (Hi-Depth Cache misses)."
+             data_type="uint64"
+             equation="B 5 READ"
+             underscore_name="gti_hiz_memory_reads"
+             units="messages"
+             symbol_name="GtiHizMemoryReads"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Depth Cache"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="GtiRccMemoryReads"
+             description="The total number of GTI memory reads from Render Color Cache (Render Color Cache misses)."
+             data_type="uint64"
+             equation="B 3 READ"
+             underscore_name="gti_rcc_memory_reads"
+             units="messages"
+             symbol_name="GtiRccMemoryReads"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Color Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GtiL3Bank1Reads"
+             description="The total number of GTI memory reads from L3 Bank 1 (L3 Cache misses)."
+             data_type="uint64"
+             equation="C 5 READ"
+             underscore_name="gti_l3_bank1_reads"
+             units="messages"
+             symbol_name="GtiL3Bank1Reads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="GTI/L3"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GtiCmdStreamerMemoryReads"
+             description="The total number of GTI memory reads from Command Streamer."
+             data_type="uint64"
+             equation="B 0 READ"
+             underscore_name="gti_cmd_streamer_memory_reads"
+             units="messages"
+             symbol_name="GtiCmdStreamerMemoryReads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/3D Pipe/Command Streamer"
+             />
+    <counter name="GtiL3Bank2Reads"
+             description="The total number of GTI memory reads from L3 Bank 2 (L3 Cache misses)."
+             data_type="uint64"
+             equation="C 6 READ"
+             underscore_name="gti_l3_bank2_reads"
+             units="messages"
+             symbol_name="GtiL3Bank2Reads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="GTI/L3"
+             />
+    <counter name="GtiMemoryReads"
+             description="The total number of GTI memory reads."
+             data_type="uint64"
+             equation="C 0 READ"
+             underscore_name="gti_memory_reads"
+             units="messages"
+             symbol_name="GtiMemoryReads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="GtiRczMemoryReads"
+             description="The total number of GTI memory reads from Render Depth Cache (Render Depth Cache misses)."
+             data_type="uint64"
+             equation="B 7 READ"
+             underscore_name="gti_rcz_memory_reads"
+             units="messages"
+             symbol_name="GtiRczMemoryReads"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Depth Cache"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="GtiMscMemoryReads"
+             description="The total number of GTI memory reads from Multisampling Color Cache (Multisampling Color Cache misses)."
+             data_type="uint64"
+             equation="B 4 READ"
+             underscore_name="gti_msc_memory_reads"
+             units="messages"
+             symbol_name="GtiMscMemoryReads"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Color Cache"
+             />
+    <counter name="GtiVfMemoryReads"
+             description="The total number of GTI memory reads from Vertex Fetch."
+             data_type="uint64"
+             equation="B 1 READ"
+             underscore_name="gti_vf_memory_reads"
+             units="messages"
+             symbol_name="GtiVfMemoryReads"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/3D Pipe/Vertex Fetch"
+             />
+    <counter name="GtiStcMemoryReads"
+             description="The total number of GTI memory reads from Stencil Cache (Stencil Cache misses)."
+             data_type="uint64"
+             equation="B 6 READ"
+             underscore_name="gti_stc_memory_reads"
+             units="messages"
+             symbol_name="GtiStcMemoryReads"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Depth Cache"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GtiL3Reads"
+             description="The total number of GTI memory reads from L3 (L3 Cache misses)."
+             data_type="uint64"
+             equation="$GtiL3Bank0Reads $GtiL3Bank1Reads $GtiL3Bank2Reads $GtiL3Bank3Reads UADD UADD UADD"
+             underscore_name="gti_l3_reads"
+             units="messages"
+             symbol_name="GtiL3Reads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/L3"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x11810C00" />
+        <register type="NOA" address="0x00009888" value="0x1381001A" />
+        <register type="NOA" address="0x00009888" value="0x37906800" />
+        <register type="NOA" address="0x00009888" value="0x3F900064" />
+        <register type="NOA" address="0x00009888" value="0x03811300" />
+        <register type="NOA" address="0x00009888" value="0x05811B12" />
+        <register type="NOA" address="0x00009888" value="0x0781001A" />
+        <register type="NOA" address="0x00009888" value="0x1F810000" />
+        <register type="NOA" address="0x00009888" value="0x17810000" />
+        <register type="NOA" address="0x00009888" value="0x19810000" />
+        <register type="NOA" address="0x00009888" value="0x1B810000" />
+        <register type="NOA" address="0x00009888" value="0x1D810000" />
+        <register type="NOA" address="0x00009888" value="0x1B930055" />
+        <register type="NOA" address="0x00009888" value="0x03E58000" />
+        <register type="NOA" address="0x00009888" value="0x05E5C000" />
+        <register type="NOA" address="0x00009888" value="0x07E54000" />
+        <register type="NOA" address="0x00009888" value="0x13900150" />
+        <register type="NOA" address="0x00009888" value="0x21900151" />
+        <register type="NOA" address="0x00009888" value="0x23900152" />
+        <register type="NOA" address="0x00009888" value="0x25900153" />
+        <register type="NOA" address="0x00009888" value="0x27900154" />
+        <register type="NOA" address="0x00009888" value="0x29900155" />
+        <register type="NOA" address="0x00009888" value="0x2B900156" />
+        <register type="NOA" address="0x00009888" value="0x2D900157" />
+        <register type="NOA" address="0x00009888" value="0x2F90015F" />
+        <register type="NOA" address="0x00009888" value="0x31900105" />
+        <register type="NOA" address="0x00009888" value="0x15900103" />
+        <register type="NOA" address="0x00009888" value="0x17900101" />
+        <register type="NOA" address="0x00009888" value="0x35900000" />
+        <register type="NOA" address="0x00009888" value="0x19908000" />
+        <register type="NOA" address="0x00009888" value="0x1B908000" />
+        <register type="NOA" address="0x00009888" value="0x1D908000" />
+        <register type="NOA" address="0x00009888" value="0x1F908000" />
+        <register type="NOA" address="0x00009888" value="0x11900000" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x41900C60" />
+        <register type="NOA" address="0x00009888" value="0x55900000" />
+        <register type="NOA" address="0x00009888" value="0x45900C00" />
+        <register type="NOA" address="0x00009888" value="0x47900C63" />
+        <register type="NOA" address="0x00009888" value="0x57900000" />
+        <register type="NOA" address="0x00009888" value="0x49900C63" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+        <register type="NOA" address="0x00009888" value="0x4B900063" />
+        <register type="NOA" address="0x00009888" value="0x59900000" />
+        <register type="NOA" address="0x00009888" value="0x43900003" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x0000272C" value="0xFFFFFFFF" />
+        <register type="OA" address="0x00002728" value="0xFFFFFFFF" />
+        <register type="OA" address="0x00002724" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x0000271C" value="0xFFFFFFFF" />
+        <register type="OA" address="0x00002718" value="0xFFFFFFFF" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x0000274C" value="0x86543210" />
+        <register type="OA" address="0x00002748" value="0x86543210" />
+        <register type="OA" address="0x00002744" value="0x00006667" />
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x0000275C" value="0x86543210" />
+        <register type="OA" address="0x00002758" value="0x86543210" />
+        <register type="OA" address="0x00002754" value="0x00006465" />
+        <register type="OA" address="0x00002750" value="0x00000000" />
+        <register type="OA" address="0x00002770" value="0x0007F81A" />
+        <register type="OA" address="0x00002774" value="0x0000FE00" />
+        <register type="OA" address="0x00002778" value="0x0007F82A" />
+        <register type="OA" address="0x0000277C" value="0x0000FE00" />
+        <register type="OA" address="0x00002780" value="0x0007F872" />
+        <register type="OA" address="0x00002784" value="0x0000FE00" />
+        <register type="OA" address="0x00002788" value="0x0007F8BA" />
+        <register type="OA" address="0x0000278C" value="0x0000FE00" />
+        <register type="OA" address="0x00002790" value="0x0007F87A" />
+        <register type="OA" address="0x00002794" value="0x0000FE00" />
+        <register type="OA" address="0x00002798" value="0x0007F8EA" />
+        <register type="OA" address="0x0000279C" value="0x0000FE00" />
+        <register type="OA" address="0x000027A0" value="0x0007F8E2" />
+        <register type="OA" address="0x000027A4" value="0x0000FE00" />
+        <register type="OA" address="0x000027A8" value="0x0007F8F2" />
+        <register type="OA" address="0x000027AC" value="0x0000FE00" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00015014" />
+        <register type="FLEX" address="0x0000E658" value="0x00025024" />
+        <register type="FLEX" address="0x0000E758" value="0x00035034" />
+        <register type="FLEX" address="0x0000E45C" value="0x00045044" />
+        <register type="FLEX" address="0x0000E55C" value="0x00055054" />
+        <register type="FLEX" address="0x0000E65C" value="0x00065064" />
+    </register_config>
+  </set>
+
+  <set name="Memory Writes Distribution Gen9"
+       mdapi_supported_apis="VK VK OGL OCL IO BB"
+       underscore_name="memory_writes"
+       hw_config_guid="055f256d-4052-467c-8dec-6064a4806433"
+       chipset="SKLGT4"
+       symbol_name="MemoryWrites"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GtiMemoryWrites"
+             description="The total number of GTI memory writes."
+             data_type="uint64"
+             equation="C 0 READ"
+             underscore_name="gti_memory_writes"
+             units="messages"
+             symbol_name="GtiMemoryWrites"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="GtiRingAccesses"
+             description="The total number of all GTI accesses to the ring."
+             data_type="uint64"
+             equation="C 3 READ 2 UMUL"
+             underscore_name="gti_ring_accesses"
+             units="messages"
+             symbol_name="GtiRingAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="GtiMscMemoryWrites"
+             description="The total number of GTI memory writes from Multisampling Color Cache (Multisampling Color Cache invalidations)."
+             data_type="uint64"
+             equation="B 4 READ"
+             underscore_name="gti_msc_memory_writes"
+             units="messages"
+             symbol_name="GtiMscMemoryWrites"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Color Cache"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="GtiCmdStreamerMemoryWrites"
+             description="The total number of GTI memory writes from Command Streamer."
+             data_type="uint64"
+             equation="B 0 READ"
+             underscore_name="gti_cmd_streamer_memory_writes"
+             units="messages"
+             symbol_name="GtiCmdStreamerMemoryWrites"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/3D Pipe/Command Streamer"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GtiL3Bank0Writes"
+             description="The total number of GTI memory writes from L3 Bank 0 (L3 Bank 0 invalidations)."
+             data_type="uint64"
+             equation="C 4 READ"
+             underscore_name="gti_l3_bank0_writes"
+             units="messages"
+             symbol_name="GtiL3Bank0Writes"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/L3"
+             />
+    <counter name="GtiL3Bank1Writes"
+             description="The total number of GTI memory writes from L3 Bank 1 (L3 Bank 1 invalidations)."
+             data_type="uint64"
+             equation="C 5 READ"
+             underscore_name="gti_l3_bank1_writes"
+             units="messages"
+             symbol_name="GtiL3Bank1Writes"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/L3"
+             />
+    <counter name="GtiL3Bank2Writes"
+             description="The total number of GTI memory writes from L3 Bank 2 (L3 Bank 2 invalidations)."
+             data_type="uint64"
+             equation="C 6 READ"
+             underscore_name="gti_l3_bank2_writes"
+             units="messages"
+             symbol_name="GtiL3Bank2Writes"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/L3"
+             />
+    <counter name="GtiL3Bank3Writes"
+             description="The total number of GTI memory writes from L3 Bank 3 (L3 Bank 3 invalidations)."
+             data_type="uint64"
+             equation="C 7 READ"
+             underscore_name="gti_l3_bank3_writes"
+             units="messages"
+             symbol_name="GtiL3Bank3Writes"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/L3"
+             />
+    <counter name="GtiL3Writes"
+             description="The total number of GTI memory writes from L3 (L3 invalidations)."
+             data_type="uint64"
+             equation="$GtiL3Bank0Writes $GtiL3Bank1Writes $GtiL3Bank2Writes $GtiL3Bank3Writes UADD UADD UADD"
+             underscore_name="gti_l3_writes"
+             units="messages"
+             symbol_name="GtiL3Writes"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/L3"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GtiRccMemoryWrites"
+             description="The total number of GTI memory writes from Render Color Cache (Render Color Cache invalidations)."
+             data_type="uint64"
+             equation="B 3 READ"
+             underscore_name="gti_rcc_memory_writes"
+             units="messages"
+             symbol_name="GtiRccMemoryWrites"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Color Cache"
+             />
+    <counter name="GtiSoMemoryWrites"
+             description="The total number of GTI memory writes from Stream Output."
+             data_type="uint64"
+             equation="B 2 READ"
+             underscore_name="gti_so_memory_writes"
+             units="messages"
+             symbol_name="GtiSoMemoryWrites"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/3D Pipe/Stream Output"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GtiStcMemoryWrites"
+             description="The total number of GTI memory writes from Stencil Cache."
+             data_type="uint64"
+             equation="B 6 READ"
+             underscore_name="gti_stc_memory_writes"
+             units="messages"
+             symbol_name="GtiStcMemoryWrites"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Depth Cache"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="GtiRczMemoryWrites"
+             description="The total number of GTI memory writes from Render Depth Cache."
+             data_type="uint64"
+             equation="B 7 READ"
+             underscore_name="gti_rcz_memory_writes"
+             units="messages"
+             symbol_name="GtiRczMemoryWrites"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Depth Cache"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="GtiHizMemoryWrites"
+             description="The total number of GTI memory writes from Hierarchical Depth Cache."
+             data_type="uint64"
+             equation="B 5 READ"
+             underscore_name="gti_hiz_memory_writes"
+             units="messages"
+             symbol_name="GtiHizMemoryWrites"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Depth Cache"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x11810C00" />
+        <register type="NOA" address="0x00009888" value="0x1381001A" />
+        <register type="NOA" address="0x00009888" value="0x37906800" />
+        <register type="NOA" address="0x00009888" value="0x3F901000" />
+        <register type="NOA" address="0x00009888" value="0x03811300" />
+        <register type="NOA" address="0x00009888" value="0x05811B12" />
+        <register type="NOA" address="0x00009888" value="0x0781001A" />
+        <register type="NOA" address="0x00009888" value="0x1F810000" />
+        <register type="NOA" address="0x00009888" value="0x17810000" />
+        <register type="NOA" address="0x00009888" value="0x19810000" />
+        <register type="NOA" address="0x00009888" value="0x1B810000" />
+        <register type="NOA" address="0x00009888" value="0x1D810000" />
+        <register type="NOA" address="0x00009888" value="0x1B930055" />
+        <register type="NOA" address="0x00009888" value="0x03E58000" />
+        <register type="NOA" address="0x00009888" value="0x05E5C000" />
+        <register type="NOA" address="0x00009888" value="0x07E54000" />
+        <register type="NOA" address="0x00009888" value="0x13900160" />
+        <register type="NOA" address="0x00009888" value="0x21900161" />
+        <register type="NOA" address="0x00009888" value="0x23900162" />
+        <register type="NOA" address="0x00009888" value="0x25900163" />
+        <register type="NOA" address="0x00009888" value="0x27900164" />
+        <register type="NOA" address="0x00009888" value="0x29900165" />
+        <register type="NOA" address="0x00009888" value="0x2B900166" />
+        <register type="NOA" address="0x00009888" value="0x2D900167" />
+        <register type="NOA" address="0x00009888" value="0x2F900150" />
+        <register type="NOA" address="0x00009888" value="0x31900105" />
+        <register type="NOA" address="0x00009888" value="0x15900103" />
+        <register type="NOA" address="0x00009888" value="0x17900101" />
+        <register type="NOA" address="0x00009888" value="0x35900000" />
+        <register type="NOA" address="0x00009888" value="0x19908000" />
+        <register type="NOA" address="0x00009888" value="0x1B908000" />
+        <register type="NOA" address="0x00009888" value="0x1D908000" />
+        <register type="NOA" address="0x00009888" value="0x1F908000" />
+        <register type="NOA" address="0x00009888" value="0x11900000" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x41900C60" />
+        <register type="NOA" address="0x00009888" value="0x55900000" />
+        <register type="NOA" address="0x00009888" value="0x45900C00" />
+        <register type="NOA" address="0x00009888" value="0x47900C63" />
+        <register type="NOA" address="0x00009888" value="0x57900000" />
+        <register type="NOA" address="0x00009888" value="0x49900C63" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+        <register type="NOA" address="0x00009888" value="0x4B900063" />
+        <register type="NOA" address="0x00009888" value="0x59900000" />
+        <register type="NOA" address="0x00009888" value="0x43900003" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x0000272C" value="0xFFFFFFFF" />
+        <register type="OA" address="0x00002728" value="0xFFFFFFFF" />
+        <register type="OA" address="0x00002724" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x0000271C" value="0xFFFFFFFF" />
+        <register type="OA" address="0x00002718" value="0xFFFFFFFF" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x0000274C" value="0x86543210" />
+        <register type="OA" address="0x00002748" value="0x86543210" />
+        <register type="OA" address="0x00002744" value="0x00006667" />
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x0000275C" value="0x86543210" />
+        <register type="OA" address="0x00002758" value="0x86543210" />
+        <register type="OA" address="0x00002754" value="0x00006465" />
+        <register type="OA" address="0x00002750" value="0x00000000" />
+        <register type="OA" address="0x00002770" value="0x0007F81A" />
+        <register type="OA" address="0x00002774" value="0x0000FE00" />
+        <register type="OA" address="0x00002778" value="0x0007F82A" />
+        <register type="OA" address="0x0000277C" value="0x0000FE00" />
+        <register type="OA" address="0x00002780" value="0x0007F822" />
+        <register type="OA" address="0x00002784" value="0x0000FE00" />
+        <register type="OA" address="0x00002788" value="0x0007F8BA" />
+        <register type="OA" address="0x0000278C" value="0x0000FE00" />
+        <register type="OA" address="0x00002790" value="0x0007F87A" />
+        <register type="OA" address="0x00002794" value="0x0000FE00" />
+        <register type="OA" address="0x00002798" value="0x0007F8EA" />
+        <register type="OA" address="0x0000279C" value="0x0000FE00" />
+        <register type="OA" address="0x000027A0" value="0x0007F8E2" />
+        <register type="OA" address="0x000027A4" value="0x0000FE00" />
+        <register type="OA" address="0x000027A8" value="0x0007F8F2" />
+        <register type="OA" address="0x000027AC" value="0x0000FE00" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00015014" />
+        <register type="FLEX" address="0x0000E658" value="0x00025024" />
+        <register type="FLEX" address="0x0000E758" value="0x00035034" />
+        <register type="FLEX" address="0x0000E45C" value="0x00045044" />
+        <register type="FLEX" address="0x0000E55C" value="0x00055054" />
+        <register type="FLEX" address="0x0000E65C" value="0x00065064" />
+    </register_config>
+  </set>
+
+  <set name="Compute Metrics Extended Gen9"
+       mdapi_supported_apis="VK VK OGL4 OCL IO BB"
+       underscore_name="compute_extended"
+       hw_config_guid="753972d4-87cd-4460-824d-754463ac5054"
+       chipset="SKLGT4"
+       symbol_name="ComputeExtended"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="fpu0_active"
+             units="percent"
+             symbol_name="Fpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="fpu1_active"
+             units="percent"
+             symbol_name="Fpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU AVG IPC Rate"
+             description="The average rate of IPC calculated for 2 FPU pipelines."
+             data_type="float"
+             max_equation="2"
+             equation="A 9 READ  A 10 READ  A 11 READ UADD  A 9 READ USUB FDIV 1 FADD"
+             underscore_name="eu_avg_ipc_rate"
+             units="number"
+             symbol_name="EuAvgIpcRate"
+             semantic_type="ratio"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Typed Writes 0"
+             description="The subslice 0 typed writes."
+             data_type="uint64"
+             equation="C 0 READ"
+             underscore_name="typed_writes0"
+             units="messages"
+             symbol_name="TypedWrites0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="EuTypedAtomics0"
+             description="The subslice 0 EU Typed Atomics subslice 0."
+             data_type="uint64"
+             equation="B 5 READ"
+             underscore_name="eu_typed_atomics0"
+             units="messages"
+             symbol_name="EuTypedAtomics0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="Typed Atomics 0"
+             description="The subslice 0 typed atomics."
+             data_type="uint64"
+             equation="C 4 READ"
+             underscore_name="typed_atomics0"
+             units="messages"
+             symbol_name="TypedAtomics0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="TypedAtomicsPerCacheLine"
+             description="The ratio of EU typed atomics requests to L3 cache line writes."
+             data_type="float"
+             equation="$EuTypedAtomics0 $TypedAtomics0 FDIV"
+             underscore_name="typed_atomics_per_cache_line"
+             units="eu sends to l3 cache lines"
+             symbol_name="TypedAtomicsPerCacheLine"
+             semantic_type="ratio"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="EuUntypedReads0"
+             description="The subslice 0 EU Untyped Reads subslice 0."
+             data_type="uint64"
+             equation="B 0 READ"
+             underscore_name="eu_untyped_reads0"
+             units="messages"
+             symbol_name="EuUntypedReads0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="Untyped Writes 0"
+             description="The subslice 0 untyped writes (including SLM writes)."
+             data_type="uint64"
+             equation="C 1 READ"
+             underscore_name="untyped_writes0"
+             units="messages"
+             symbol_name="UntypedWrites0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="EuUntypedAtomics0"
+             description="The subslice 0 EU Untyped Atomics subslice 0."
+             data_type="uint64"
+             equation="B 4 READ"
+             underscore_name="eu_untyped_atomics0"
+             units="messages"
+             symbol_name="EuUntypedAtomics0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="EuUntypedWrites0"
+             description="The subslice 0 EU Untyped Writes subslice 0."
+             data_type="uint64"
+             equation="B 1 READ"
+             underscore_name="eu_untyped_writes0"
+             units="messages"
+             symbol_name="EuUntypedWrites0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="EuA64UntypedWrites0"
+             description="The subslice 0 EU A64 Untyped Writes subslice 0."
+             data_type="uint64"
+             equation="B 7 READ"
+             underscore_name="eu_a64_untyped_writes0"
+             units="messages"
+             symbol_name="EuA64UntypedWrites0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="UntypedWritesPerCacheLine"
+             description="The ratio of EU untyped write requests to L3 cache line writes."
+             data_type="float"
+             equation="$EuUntypedWrites0 $EuA64UntypedWrites0 UADD $UntypedWrites0 FDIV"
+             underscore_name="untyped_writes_per_cache_line"
+             units="eu sends to l3 cache lines"
+             symbol_name="UntypedWritesPerCacheLine"
+             semantic_type="ratio"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EuTypedWrites0"
+             description="The subslice 0 EU Typed Writes subslice 0."
+             data_type="uint64"
+             equation="B 3 READ"
+             underscore_name="eu_typed_writes0"
+             units="messages"
+             symbol_name="EuTypedWrites0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="TypedWritesPerCacheLine"
+             description="The ratio of EU typed write requests to L3 cache line writes."
+             data_type="float"
+             equation="$EuTypedWrites0 $TypedWrites0 FDIV"
+             underscore_name="typed_writes_per_cache_line"
+             units="eu sends to l3 cache lines"
+             symbol_name="TypedWritesPerCacheLine"
+             semantic_type="ratio"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="Typed Reads 0"
+             description="The subslice 0 typed reads."
+             data_type="uint64"
+             equation="C 2 READ"
+             underscore_name="typed_reads0"
+             units="messages"
+             symbol_name="TypedReads0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="Untyped Reads 0"
+             description="The subslice 0 untyped reads (including SLM reads)."
+             data_type="uint64"
+             equation="C 3 READ"
+             underscore_name="untyped_reads0"
+             units="messages"
+             symbol_name="UntypedReads0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="EuA64UntypedReads0"
+             description="The subslice 0 EU A64 untyped reads."
+             data_type="uint64"
+             equation="B 6 READ"
+             underscore_name="eu_a64_untyped_reads0"
+             units="messages"
+             symbol_name="EuA64UntypedReads0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="EU Thread Occupancy"
+             description="The percentage of time in which hardware threads occupied EUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 13 READ 8 UMUL $EuCoresTotalCount UDIV $EuThreadsCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_thread_occupancy"
+             units="percent"
+             symbol_name="EuThreadOccupancy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EuTypedReads0"
+             description="The subslice 0 EU typed reads."
+             data_type="uint64"
+             equation="B 2 READ"
+             underscore_name="eu_typed_reads0"
+             units="messages"
+             symbol_name="EuTypedReads0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="UntypedReadsPerCacheLine"
+             description="The ratio of EU untyped read requests to L3 cache line reads."
+             data_type="float"
+             equation="$EuUntypedReads0 $EuA64UntypedReads0 UADD $UntypedReads0 FDIV"
+             underscore_name="untyped_reads_per_cache_line"
+             units="eu sends to l3 cache lines"
+             symbol_name="UntypedReadsPerCacheLine"
+             semantic_type="ratio"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="TypedReadsPerCacheLine"
+             description="The ratio of EU typed read requests to L3 cache line reads."
+             data_type="float"
+             equation="$EuTypedReads0 $TypedReads0 FDIV"
+             underscore_name="typed_reads_per_cache_line"
+             units="eu sends to l3 cache lines"
+             symbol_name="TypedReadsPerCacheLine"
+             semantic_type="ratio"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <counter name="EU Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_send_active"
+             units="percent"
+             symbol_name="EuSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x106C00E0" />
+        <register type="NOA" address="0x00009888" value="0x141C8160" />
+        <register type="NOA" address="0x00009888" value="0x161C8015" />
+        <register type="NOA" address="0x00009888" value="0x181C0120" />
+        <register type="NOA" address="0x00009888" value="0x004E8000" />
+        <register type="NOA" address="0x00009888" value="0x0E4E8000" />
+        <register type="NOA" address="0x00009888" value="0x184E8000" />
+        <register type="NOA" address="0x00009888" value="0x1A4EAAA0" />
+        <register type="NOA" address="0x00009888" value="0x1C4E0002" />
+        <register type="NOA" address="0x00009888" value="0x024E8000" />
+        <register type="NOA" address="0x00009888" value="0x044E8000" />
+        <register type="NOA" address="0x00009888" value="0x064E8000" />
+        <register type="NOA" address="0x00009888" value="0x084E8000" />
+        <register type="NOA" address="0x00009888" value="0x0A4E8000" />
+        <register type="NOA" address="0x00009888" value="0x0E6C0B01" />
+        <register type="NOA" address="0x00009888" value="0x006C0200" />
+        <register type="NOA" address="0x00009888" value="0x026C000C" />
+        <register type="NOA" address="0x00009888" value="0x1C6C0000" />
+        <register type="NOA" address="0x00009888" value="0x1E6C0000" />
+        <register type="NOA" address="0x00009888" value="0x1A6C0000" />
+        <register type="NOA" address="0x00009888" value="0x0E1BC000" />
+        <register type="NOA" address="0x00009888" value="0x001B8000" />
+        <register type="NOA" address="0x00009888" value="0x021BC000" />
+        <register type="NOA" address="0x00009888" value="0x001C0041" />
+        <register type="NOA" address="0x00009888" value="0x061C4200" />
+        <register type="NOA" address="0x00009888" value="0x081C4443" />
+        <register type="NOA" address="0x00009888" value="0x0A1C4645" />
+        <register type="NOA" address="0x00009888" value="0x0C1C7647" />
+        <register type="NOA" address="0x00009888" value="0x041C7357" />
+        <register type="NOA" address="0x00009888" value="0x1C1C0030" />
+        <register type="NOA" address="0x00009888" value="0x101C0000" />
+        <register type="NOA" address="0x00009888" value="0x1A1C0000" />
+        <register type="NOA" address="0x00009888" value="0x121C8000" />
+        <register type="NOA" address="0x00009888" value="0x004C8000" />
+        <register type="NOA" address="0x00009888" value="0x0A4CAA2A" />
+        <register type="NOA" address="0x00009888" value="0x0C4C02AA" />
+        <register type="NOA" address="0x00009888" value="0x084CA000" />
+        <register type="NOA" address="0x00009888" value="0x000DA000" />
+        <register type="NOA" address="0x00009888" value="0x060D8000" />
+        <register type="NOA" address="0x00009888" value="0x080DA000" />
+        <register type="NOA" address="0x00009888" value="0x0A0DA000" />
+        <register type="NOA" address="0x00009888" value="0x0C0DA000" />
+        <register type="NOA" address="0x00009888" value="0x0E0DA000" />
+        <register type="NOA" address="0x00009888" value="0x020DA000" />
+        <register type="NOA" address="0x00009888" value="0x040DA000" />
+        <register type="NOA" address="0x00009888" value="0x0C0F5400" />
+        <register type="NOA" address="0x00009888" value="0x0E0F5515" />
+        <register type="NOA" address="0x00009888" value="0x100F0155" />
+        <register type="NOA" address="0x00009888" value="0x002C8000" />
+        <register type="NOA" address="0x00009888" value="0x0E2C8000" />
+        <register type="NOA" address="0x00009888" value="0x162CAA00" />
+        <register type="NOA" address="0x00009888" value="0x182C00AA" />
+        <register type="NOA" address="0x00009888" value="0x022C8000" />
+        <register type="NOA" address="0x00009888" value="0x042C8000" />
+        <register type="NOA" address="0x00009888" value="0x062C8000" />
+        <register type="NOA" address="0x00009888" value="0x082C8000" />
+        <register type="NOA" address="0x00009888" value="0x0A2C8000" />
+        <register type="NOA" address="0x00009888" value="0x11907FFF" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x41900040" />
+        <register type="NOA" address="0x00009888" value="0x55900000" />
+        <register type="NOA" address="0x00009888" value="0x45900802" />
+        <register type="NOA" address="0x00009888" value="0x47900842" />
+        <register type="NOA" address="0x00009888" value="0x57900000" />
+        <register type="NOA" address="0x00009888" value="0x49900842" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+        <register type="NOA" address="0x00009888" value="0x4B900000" />
+        <register type="NOA" address="0x00009888" value="0x59900000" />
+        <register type="NOA" address="0x00009888" value="0x43900800" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002724" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002770" value="0x0007FC2A" />
+        <register type="OA" address="0x00002774" value="0x0000BF00" />
+        <register type="OA" address="0x00002778" value="0x0007FC6A" />
+        <register type="OA" address="0x0000277C" value="0x0000BF00" />
+        <register type="OA" address="0x00002780" value="0x0007FC92" />
+        <register type="OA" address="0x00002784" value="0x0000BF00" />
+        <register type="OA" address="0x00002788" value="0x0007FCA2" />
+        <register type="OA" address="0x0000278C" value="0x0000BF00" />
+        <register type="OA" address="0x00002790" value="0x0007FC32" />
+        <register type="OA" address="0x00002794" value="0x0000BF00" />
+        <register type="OA" address="0x00002798" value="0x0007FC9A" />
+        <register type="OA" address="0x0000279C" value="0x0000BF00" />
+        <register type="OA" address="0x000027A0" value="0x0007FE6A" />
+        <register type="OA" address="0x000027A4" value="0x0000BF00" />
+        <register type="OA" address="0x000027A8" value="0x0007FE7A" />
+        <register type="OA" address="0x000027AC" value="0x0000BF00" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00000003" />
+        <register type="FLEX" address="0x0000E658" value="0x00002001" />
+        <register type="FLEX" address="0x0000E758" value="0x00778008" />
+        <register type="FLEX" address="0x0000E45C" value="0x00088078" />
+        <register type="FLEX" address="0x0000E55C" value="0x00808708" />
+        <register type="FLEX" address="0x0000E65C" value="0x00A08908" />
+    </register_config>
+  </set>
+
+  <set name="Compute Metrics L3 Cache Gen9"
+       mdapi_supported_apis="VK VK OGL4 OCL IO BB"
+       underscore_name="compute_l3_cache"
+       hw_config_guid="4e4392e9-8f73-457b-ab44-b49f7a0c733b"
+       chipset="SKLGT4"
+       symbol_name="ComputeL3Cache"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Bank 03 Accesses"
+             description="The total number of accesses to L3 Bank 03."
+             data_type="uint64"
+             equation="B 3 READ 2 UMUL"
+             underscore_name="l3_bank03_accesses"
+             units="messages"
+             symbol_name="L3Bank03Accesses"
+             availability="$SliceMask 0x01 AND"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="slice"
+             mdapi_group="L3"
+             />
+    <counter name="L3 Accesses"
+             description="The total number of L3 accesses from all entities."
+             data_type="uint64"
+             equation="C 0 READ C 1 READ B 2 READ B 3 READ UADD UADD UADD 2 UMUL"
+             underscore_name="l3_accesses"
+             units="messages"
+             symbol_name="L3Accesses"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Sampler Throughput"
+             description="The total number of GPU memory bytes transferred between samplers and L3 caches."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="A 29 READ 64 UMUL"
+             underscore_name="l3_sampler_throughput"
+             units="bytes"
+             symbol_name="L3SamplerThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Sampler"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="fpu0_active"
+             units="percent"
+             symbol_name="Fpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="fpu1_active"
+             units="percent"
+             symbol_name="Fpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU AVG IPC Rate"
+             description="The average rate of IPC calculated for 2 FPU pipelines."
+             data_type="float"
+             max_equation="2"
+             equation="A 9 READ  A 10 READ  A 11 READ UADD  A 9 READ USUB FDIV 1 FADD"
+             underscore_name="eu_avg_ipc_rate"
+             units="number"
+             symbol_name="EuAvgIpcRate"
+             semantic_type="ratio"
+             mdapi_supported_apis="VK VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier4 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU0 Binary Instruction"
+             description="The percentage of time in which execution units were actively processing binary instructions on FPU0."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_binary_fpu0_instruction"
+             units="percent"
+             symbol_name="EuBinaryFpu0Instruction"
+             semantic_type="duration"
+             mdapi_supported_apis="VK VK OGL IO BB"
+             mdapi_usage_flags="Tier4 System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes/Instructions"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="EU FPU0 Hybrid Instruction"
+             description="The percentage of time in which execution units were actively processing hybrid instructions on FPU0."
+             data_type="float"
+             max_equation="100"
+             equation="A 13 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_hybrid_fpu0_instruction"
+             units="percent"
+             symbol_name="EuHybridFpu0Instruction"
+             semantic_type="duration"
+             mdapi_supported_apis="VK VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="EU Array/Pipes/Instructions"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Misses"
+             description="The total number of L3 misses."
+             data_type="uint64"
+             equation="C 4 READ C 5 READ UADD"
+             underscore_name="l3_misses"
+             units="messages"
+             symbol_name="L3Misses"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/TAG"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="L3 Bank 00 Accesses"
+             description="The total number of accesses to L3 Bank 00."
+             data_type="uint64"
+             equation="C 0 READ 2 UMUL"
+             underscore_name="l3_bank00_accesses"
+             units="messages"
+             symbol_name="L3Bank00Accesses"
+             availability="$SliceMask 0x01 AND"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="slice"
+             mdapi_group="L3"
+             />
+    <counter name="EU FPU0 Move Instruction"
+             description="The percentage of time in which execution units were actively processing move instructions on FPU0."
+             data_type="float"
+             max_equation="100"
+             equation="A 19 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_move_fpu0_instruction"
+             units="percent"
+             symbol_name="EuMoveFpu0Instruction"
+             semantic_type="duration"
+             mdapi_supported_apis="VK VK OGL IO BB"
+             mdapi_usage_flags="Tier4 System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes/Instructions"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU FPU1 Hybrid Instruction"
+             description="The percentage of time in which execution units were actively processing hybrid instructions on FPU1."
+             data_type="float"
+             max_equation="100"
+             equation="A 14 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_hybrid_fpu1_instruction"
+             units="percent"
+             symbol_name="EuHybridFpu1Instruction"
+             semantic_type="duration"
+             mdapi_supported_apis="VK VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="EU Array/Pipes/Instructions"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis="VK VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texel lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GTI Read Throughput"
+             description="The total number of GPU memory bytes read from GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL"
+             equation="C 6 READ 64 UMUL"
+             underscore_name="gti_read_throughput"
+             units="bytes"
+             symbol_name="GtiReadThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GTI L3 Throughput"
+             description="The total number of GPU memory bytes transferred between L3 caches and GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="C 4 READ C 5 READ UADD 64 UMUL"
+             underscore_name="gti_l3_throughput"
+             units="bytes"
+             symbol_name="GtiL3Throughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Bank 00 IC Accesses"
+             description="The total number of accesses to L3 Bank 00 from IC cache."
+             data_type="uint64"
+             equation="B 0 READ B 1 READ UADD 2 UMUL $L3Bank00Accesses UMIN"
+             underscore_name="l3_bank00_ic_accesses"
+             units="messages"
+             symbol_name="L3Bank00IcAccesses"
+             availability="$SliceMask 0x01 AND"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="slice"
+             mdapi_group="L3/IC"
+             />
+    <counter name="L3 Bank 00 IC Hits"
+             description="The total number of hits in L3 Bank 00 from IC cache."
+             data_type="uint64"
+             equation="B 1 READ 2 UMUL $L3Bank00IcAccesses UMIN"
+             underscore_name="l3_bank00_ic_hits"
+             units="messages"
+             symbol_name="L3Bank00IcHits"
+             availability="$SliceMask 0x01 AND"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="slice"
+             mdapi_group="L3/IC"
+             />
+    <counter name="Sampler Accesses"
+             description="The total number of messages sent to samplers."
+             data_type="uint64"
+             equation="A 28 READ"
+             underscore_name="sampler_accesses"
+             units="messages"
+             symbol_name="SamplerAccesses"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler"
+             />
+    <counter name="L3 Bank 01 Accesses"
+             description="The total number of accesses to L3 Bank 01."
+             data_type="uint64"
+             equation="C 1 READ 2 UMUL"
+             underscore_name="l3_bank01_accesses"
+             units="messages"
+             symbol_name="L3Bank01Accesses"
+             availability="$SliceMask 0x01 AND"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="slice"
+             mdapi_group="L3"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis="VK VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU0 Ternary Instruction"
+             description="The percentage of time in which execution units were actively processing ternary instructions on FPU0."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_ternary_fpu0_instruction"
+             units="percent"
+             symbol_name="EuTernaryFpu0Instruction"
+             semantic_type="duration"
+             mdapi_supported_apis="VK VK OGL IO BB"
+             mdapi_usage_flags="Tier4 System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes/Instructions"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU FPU1 Move Instruction"
+             description="The percentage of time in which execution units were actively processing move instructions on FPU1."
+             data_type="float"
+             max_equation="100"
+             equation="A 20 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_move_fpu1_instruction"
+             units="percent"
+             symbol_name="EuMoveFpu1Instruction"
+             semantic_type="duration"
+             mdapi_supported_apis="VK VK OGL IO BB"
+             mdapi_usage_flags="Tier4 System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes/Instructions"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis="VK VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="L3 Bank 02 Accesses"
+             description="The total number of accesses to L3 Bank 02."
+             data_type="uint64"
+             equation="B 2 READ 2 UMUL"
+             underscore_name="l3_bank02_accesses"
+             units="messages"
+             symbol_name="L3Bank02Accesses"
+             availability="$SliceMask 0x01 AND"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="slice"
+             mdapi_group="L3"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="L3 Total Throughput"
+             description="The total number of GPU memory bytes transferred via L3."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="$L3Accesses 64 UMUL"
+             underscore_name="l3_total_throughput"
+             units="bytes"
+             symbol_name="L3TotalThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GTI Write Throughput"
+             description="The total number of GPU memory bytes written to GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 32 UMUL"
+             equation="C 7 READ 64 UMUL"
+             underscore_name="gti_write_throughput"
+             units="bytes"
+             symbol_name="GtiWriteThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="EU FPU1 Binary Instruction"
+             description="The percentage of time in which execution units were actively processing binary instructions on FPU1."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_binary_fpu1_instruction"
+             units="percent"
+             symbol_name="EuBinaryFpu1Instruction"
+             semantic_type="duration"
+             mdapi_supported_apis="VK VK OGL IO BB"
+             mdapi_usage_flags="Tier4 System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes/Instructions"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU1 Ternary Instruction"
+             description="The percentage of time in which execution units were actively processing ternary instructions on FPU1."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_ternary_fpu1_instruction"
+             units="percent"
+             symbol_name="EuTernaryFpu1Instruction"
+             semantic_type="duration"
+             mdapi_supported_apis="VK VK OGL IO BB"
+             mdapi_usage_flags="Tier4 System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes/Instructions"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_send_active"
+             units="percent"
+             symbol_name="EuSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x166C0760" />
+        <register type="NOA" address="0x00009888" value="0x1593001E" />
+        <register type="NOA" address="0x00009888" value="0x3F900003" />
+        <register type="NOA" address="0x00009888" value="0x004E8000" />
+        <register type="NOA" address="0x00009888" value="0x0E4E8000" />
+        <register type="NOA" address="0x00009888" value="0x184E8000" />
+        <register type="NOA" address="0x00009888" value="0x1A4E8020" />
+        <register type="NOA" address="0x00009888" value="0x1C4E0002" />
+        <register type="NOA" address="0x00009888" value="0x006C0051" />
+        <register type="NOA" address="0x00009888" value="0x066C5000" />
+        <register type="NOA" address="0x00009888" value="0x086C5C5D" />
+        <register type="NOA" address="0x00009888" value="0x0E6C5E5F" />
+        <register type="NOA" address="0x00009888" value="0x106C0000" />
+        <register type="NOA" address="0x00009888" value="0x186C0000" />
+        <register type="NOA" address="0x00009888" value="0x1C6C0000" />
+        <register type="NOA" address="0x00009888" value="0x1E6C0000" />
+        <register type="NOA" address="0x00009888" value="0x001B4000" />
+        <register type="NOA" address="0x00009888" value="0x061B8000" />
+        <register type="NOA" address="0x00009888" value="0x081BC000" />
+        <register type="NOA" address="0x00009888" value="0x0E1BC000" />
+        <register type="NOA" address="0x00009888" value="0x101C8000" />
+        <register type="NOA" address="0x00009888" value="0x1A1CE000" />
+        <register type="NOA" address="0x00009888" value="0x1C1C0030" />
+        <register type="NOA" address="0x00009888" value="0x004C8000" />
+        <register type="NOA" address="0x00009888" value="0x0A4C2A00" />
+        <register type="NOA" address="0x00009888" value="0x0C4C0280" />
+        <register type="NOA" address="0x00009888" value="0x000D2000" />
+        <register type="NOA" address="0x00009888" value="0x060D8000" />
+        <register type="NOA" address="0x00009888" value="0x080DA000" />
+        <register type="NOA" address="0x00009888" value="0x0E0DA000" />
+        <register type="NOA" address="0x00009888" value="0x0C0F0400" />
+        <register type="NOA" address="0x00009888" value="0x0E0F1500" />
+        <register type="NOA" address="0x00009888" value="0x100F0140" />
+        <register type="NOA" address="0x00009888" value="0x002C8000" />
+        <register type="NOA" address="0x00009888" value="0x0E2C8000" />
+        <register type="NOA" address="0x00009888" value="0x162C0A00" />
+        <register type="NOA" address="0x00009888" value="0x182C00A0" />
+        <register type="NOA" address="0x00009888" value="0x03933300" />
+        <register type="NOA" address="0x00009888" value="0x05930032" />
+        <register type="NOA" address="0x00009888" value="0x11930000" />
+        <register type="NOA" address="0x00009888" value="0x1B930000" />
+        <register type="NOA" address="0x00009888" value="0x1D900157" />
+        <register type="NOA" address="0x00009888" value="0x1F900158" />
+        <register type="NOA" address="0x00009888" value="0x35900000" />
+        <register type="NOA" address="0x00009888" value="0x19908000" />
+        <register type="NOA" address="0x00009888" value="0x1B908000" />
+        <register type="NOA" address="0x00009888" value="0x1190030F" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x41900000" />
+        <register type="NOA" address="0x00009888" value="0x55900000" />
+        <register type="NOA" address="0x00009888" value="0x45900021" />
+        <register type="NOA" address="0x00009888" value="0x47900000" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+        <register type="NOA" address="0x00009888" value="0x57900000" />
+        <register type="NOA" address="0x00009888" value="0x4B900000" />
+        <register type="NOA" address="0x00009888" value="0x59900000" />
+        <register type="NOA" address="0x00009888" value="0x53905555" />
+        <register type="NOA" address="0x00009888" value="0x43900000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x30800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x30800000" />
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002770" value="0x0007FFFA" />
+        <register type="OA" address="0x00002774" value="0x0000FEFE" />
+        <register type="OA" address="0x00002778" value="0x0007FFFA" />
+        <register type="OA" address="0x0000277C" value="0x0000FEFD" />
+        <register type="OA" address="0x00002790" value="0x0007FFFA" />
+        <register type="OA" address="0x00002794" value="0x0000FBEF" />
+        <register type="OA" address="0x00002798" value="0x0007FFFA" />
+        <register type="OA" address="0x0000279C" value="0x0000FBDF" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00000003" />
+        <register type="FLEX" address="0x0000E658" value="0x00002001" />
+        <register type="FLEX" address="0x0000E758" value="0x00101100" />
+        <register type="FLEX" address="0x0000E45C" value="0x00201200" />
+        <register type="FLEX" address="0x0000E55C" value="0x00301300" />
+        <register type="FLEX" address="0x0000E65C" value="0x00401400" />
+    </register_config>
+  </set>
+
+  <set name="Metric set HDCAndSF"
+       mdapi_supported_apis="VK VK OGL OCL IO BB"
+       underscore_name="hdc_and_sf"
+       hw_config_guid="75f56991-b149-4122-ade9-d9c0c80c733b"
+       chipset="SKLGT4"
+       symbol_name="HDCAndSF"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SQ is full"
+             description="The percentage of time when SQ is filled above a threshold (usually 48 entries)."
+             data_type="float"
+             max_equation="100"
+             equation="PERFCNT1 READ_REG 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gt_request_queue_full"
+             units="percent"
+             symbol_name="GTRequestQueueFull"
+             availability="true $QueryMode &&"
+             semantic_type="duration"
+             mdapi_supported_apis="VK VK OGL4 OCL"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were actively processed on both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="Polygon Data Ready"
+             description="The percentage of time in which geometry pipeline output is ready."
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="poly_data_ready"
+             units="percent"
+             symbol_name="PolyDataReady"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/3D Pipe/Strip-Fans"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texel lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="HDC stalled by L3 (s0.ss1)"
+             description="Percentage of time when HDC has messages to L3, but it's stalled due to lack of credits (s0.ss1)"
+             data_type="float"
+             max_equation="100"
+             equation="C 5 READ C 4 READ USUB 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="non_sampler_shader01_access_stalled_on_l3"
+             units="percent"
+             symbol_name="NonSamplerShader01AccessStalledOnL3"
+             availability="$SubsliceMask 0x2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="GPU/Data Port"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="HDC stalled by L3 (s0.ss2)"
+             description="Percentage of time when HDC has messages to L3, but it's stalled due to lack of credits (s0.ss2)"
+             data_type="float"
+             max_equation="100"
+             equation="C 3 READ C 2 READ USUB 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="non_sampler_shader02_access_stalled_on_l3"
+             units="percent"
+             symbol_name="NonSamplerShader02AccessStalledOnL3"
+             availability="$SubsliceMask 0x4 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="GPU/Data Port"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="HDC stalled by L3 (s0.ss0)"
+             description="Percentage of time when HDC has messages to L3, but it's stalled due to lack of credits (s0.ss0)"
+             data_type="float"
+             max_equation="100"
+             equation="C 7 READ C 6 READ USUB 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="non_sampler_shader00_access_stalled_on_l3"
+             units="percent"
+             symbol_name="NonSamplerShader00AccessStalledOnL3"
+             availability="$SubsliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="GPU/Data Port"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x000091BC" value="0xE0500000" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x104F0232" />
+        <register type="NOA" address="0x00009888" value="0x124F4640" />
+        <register type="NOA" address="0x00009888" value="0x106C0232" />
+        <register type="NOA" address="0x00009888" value="0x11834400" />
+        <register type="NOA" address="0x00009888" value="0x0A4E8000" />
+        <register type="NOA" address="0x00009888" value="0x0C4E8000" />
+        <register type="NOA" address="0x00009888" value="0x004F1880" />
+        <register type="NOA" address="0x00009888" value="0x024F08BB" />
+        <register type="NOA" address="0x00009888" value="0x044F001B" />
+        <register type="NOA" address="0x00009888" value="0x046C0100" />
+        <register type="NOA" address="0x00009888" value="0x066C000B" />
+        <register type="NOA" address="0x00009888" value="0x1A6C0000" />
+        <register type="NOA" address="0x00009888" value="0x041B8000" />
+        <register type="NOA" address="0x00009888" value="0x061B4000" />
+        <register type="NOA" address="0x00009888" value="0x1A1C1800" />
+        <register type="NOA" address="0x00009888" value="0x005B8000" />
+        <register type="NOA" address="0x00009888" value="0x025BC000" />
+        <register type="NOA" address="0x00009888" value="0x045B4000" />
+        <register type="NOA" address="0x00009888" value="0x125C8000" />
+        <register type="NOA" address="0x00009888" value="0x145C8000" />
+        <register type="NOA" address="0x00009888" value="0x165C8000" />
+        <register type="NOA" address="0x00009888" value="0x185C8000" />
+        <register type="NOA" address="0x00009888" value="0x0A4C00A0" />
+        <register type="NOA" address="0x00009888" value="0x000D8000" />
+        <register type="NOA" address="0x00009888" value="0x020DA000" />
+        <register type="NOA" address="0x00009888" value="0x040DA000" />
+        <register type="NOA" address="0x00009888" value="0x060D2000" />
+        <register type="NOA" address="0x00009888" value="0x0C0F5000" />
+        <register type="NOA" address="0x00009888" value="0x0E0F0055" />
+        <register type="NOA" address="0x00009888" value="0x022CC000" />
+        <register type="NOA" address="0x00009888" value="0x042CC000" />
+        <register type="NOA" address="0x00009888" value="0x062CC000" />
+        <register type="NOA" address="0x00009888" value="0x082CC000" />
+        <register type="NOA" address="0x00009888" value="0x0A2C8000" />
+        <register type="NOA" address="0x00009888" value="0x0C2C8000" />
+        <register type="NOA" address="0x00009888" value="0x0F828000" />
+        <register type="NOA" address="0x00009888" value="0x0F8305C0" />
+        <register type="NOA" address="0x00009888" value="0x09830000" />
+        <register type="NOA" address="0x00009888" value="0x07830000" />
+        <register type="NOA" address="0x00009888" value="0x1D950080" />
+        <register type="NOA" address="0x00009888" value="0x13928000" />
+        <register type="NOA" address="0x00009888" value="0x0F988000" />
+        <register type="NOA" address="0x00009888" value="0x31904000" />
+        <register type="NOA" address="0x00009888" value="0x1190FC00" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x59900001" />
+        <register type="NOA" address="0x00009888" value="0x4B900040" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x41900800" />
+        <register type="NOA" address="0x00009888" value="0x43900842" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+        <register type="NOA" address="0x00009888" value="0x45900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002744" value="0x00800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x10800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+        <register type="OA" address="0x00002770" value="0x00000002" />
+        <register type="OA" address="0x00002774" value="0x0000FDFF" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E758" value="0x00015014" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+        <register type="FLEX" address="0x0000E65C" value="0x00055054" />
+    </register_config>
+  </set>
+
+  <set name="Metric set L3_1"
+       mdapi_supported_apis="VK VK OGL OCL IO BB"
+       underscore_name="l3_1"
+       hw_config_guid="0d4cda70-da83-466f-b61e-7a064fe6a232"
+       chipset="SKLGT4"
+       symbol_name="L3_1"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 L3 Bank1 Active"
+             description="The percentage of time in which slice0 L3 bank1 is active"
+             data_type="float"
+             max_equation="100"
+             equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l30_bank1_active"
+             units="percent"
+             symbol_name="L30Bank1Active"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SQ is full"
+             description="The percentage of time when SQ is filled above a threshold (usually 48 entries)"
+             data_type="float"
+             max_equation="100"
+             equation="PERFCNT1 READ_REG 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gt_request_queue_full"
+             units="percent"
+             symbol_name="GTRequestQueueFull"
+             availability="true $QueryMode &&"
+             semantic_type="duration"
+             mdapi_supported_apis="VK VK OGL4 OCL"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="Slice0 L3 Bank1 Stalled"
+             description="The percentage of time in which slice0 L3 bank1 is stalled"
+             data_type="float"
+             max_equation="100"
+             equation="B 4 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l30_bank1_stalled"
+             units="percent"
+             symbol_name="L30Bank1Stalled"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 L3 Bank0 Active"
+             description="The percentage of time in which slice0 L3 bank0 is active"
+             data_type="float"
+             max_equation="100"
+             equation="C 6 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l30_bank0_active"
+             units="percent"
+             symbol_name="L30Bank0Active"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 L3 Bank0 Stalled"
+             description="The percentage of time in which slice0 L3 bank0 is stalled"
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l30_bank0_stalled"
+             units="percent"
+             symbol_name="L30Bank0Stalled"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x000091BC" value="0xE0500000" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x126C7B40" />
+        <register type="NOA" address="0x00009888" value="0x166C0020" />
+        <register type="NOA" address="0x00009888" value="0x0A603444" />
+        <register type="NOA" address="0x00009888" value="0x0A613400" />
+        <register type="NOA" address="0x00009888" value="0x1A4EA800" />
+        <register type="NOA" address="0x00009888" value="0x1C4E0002" />
+        <register type="NOA" address="0x00009888" value="0x024E8000" />
+        <register type="NOA" address="0x00009888" value="0x044E8000" />
+        <register type="NOA" address="0x00009888" value="0x064E8000" />
+        <register type="NOA" address="0x00009888" value="0x084E8000" />
+        <register type="NOA" address="0x00009888" value="0x0A4E8000" />
+        <register type="NOA" address="0x00009888" value="0x064F4000" />
+        <register type="NOA" address="0x00009888" value="0x0C6C5327" />
+        <register type="NOA" address="0x00009888" value="0x0E6C5425" />
+        <register type="NOA" address="0x00009888" value="0x006C2A00" />
+        <register type="NOA" address="0x00009888" value="0x026C285B" />
+        <register type="NOA" address="0x00009888" value="0x046C005C" />
+        <register type="NOA" address="0x00009888" value="0x106C0000" />
+        <register type="NOA" address="0x00009888" value="0x1C6C0000" />
+        <register type="NOA" address="0x00009888" value="0x1E6C0000" />
+        <register type="NOA" address="0x00009888" value="0x1A6C0800" />
+        <register type="NOA" address="0x00009888" value="0x0C1BC000" />
+        <register type="NOA" address="0x00009888" value="0x0E1BC000" />
+        <register type="NOA" address="0x00009888" value="0x001B8000" />
+        <register type="NOA" address="0x00009888" value="0x021BC000" />
+        <register type="NOA" address="0x00009888" value="0x041BC000" />
+        <register type="NOA" address="0x00009888" value="0x1C1C003C" />
+        <register type="NOA" address="0x00009888" value="0x121C8000" />
+        <register type="NOA" address="0x00009888" value="0x141C8000" />
+        <register type="NOA" address="0x00009888" value="0x161C8000" />
+        <register type="NOA" address="0x00009888" value="0x181C8000" />
+        <register type="NOA" address="0x00009888" value="0x1A1C0800" />
+        <register type="NOA" address="0x00009888" value="0x065B4000" />
+        <register type="NOA" address="0x00009888" value="0x1A5C1000" />
+        <register type="NOA" address="0x00009888" value="0x10600000" />
+        <register type="NOA" address="0x00009888" value="0x04600000" />
+        <register type="NOA" address="0x00009888" value="0x0C610044" />
+        <register type="NOA" address="0x00009888" value="0x10610000" />
+        <register type="NOA" address="0x00009888" value="0x06610000" />
+        <register type="NOA" address="0x00009888" value="0x0C4C02A8" />
+        <register type="NOA" address="0x00009888" value="0x084CA000" />
+        <register type="NOA" address="0x00009888" value="0x0A4C002A" />
+        <register type="NOA" address="0x00009888" value="0x0C0DA000" />
+        <register type="NOA" address="0x00009888" value="0x0E0DA000" />
+        <register type="NOA" address="0x00009888" value="0x000D8000" />
+        <register type="NOA" address="0x00009888" value="0x020DA000" />
+        <register type="NOA" address="0x00009888" value="0x040DA000" />
+        <register type="NOA" address="0x00009888" value="0x060D2000" />
+        <register type="NOA" address="0x00009888" value="0x100F0154" />
+        <register type="NOA" address="0x00009888" value="0x0C0F5000" />
+        <register type="NOA" address="0x00009888" value="0x0E0F0055" />
+        <register type="NOA" address="0x00009888" value="0x182C00AA" />
+        <register type="NOA" address="0x00009888" value="0x022C8000" />
+        <register type="NOA" address="0x00009888" value="0x042C8000" />
+        <register type="NOA" address="0x00009888" value="0x062C8000" />
+        <register type="NOA" address="0x00009888" value="0x082C8000" />
+        <register type="NOA" address="0x00009888" value="0x0A2C8000" />
+        <register type="NOA" address="0x00009888" value="0x0C2CC000" />
+        <register type="NOA" address="0x00009888" value="0x1190FFC0" />
+        <register type="NOA" address="0x00009888" value="0x57900000" />
+        <register type="NOA" address="0x00009888" value="0x49900420" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+        <register type="NOA" address="0x00009888" value="0x4B900021" />
+        <register type="NOA" address="0x00009888" value="0x59900000" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x41900400" />
+        <register type="NOA" address="0x00009888" value="0x43900421" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+        <register type="NOA" address="0x00009888" value="0x45900040" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002744" value="0x00800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0xF0800000" />
+        <register type="OA" address="0x00002770" value="0x00100070" />
+        <register type="OA" address="0x00002774" value="0x0000FFF1" />
+        <register type="OA" address="0x00002778" value="0x00014002" />
+        <register type="OA" address="0x0000277C" value="0x0000C3FF" />
+        <register type="OA" address="0x00002780" value="0x00010002" />
+        <register type="OA" address="0x00002784" value="0x0000C7FF" />
+        <register type="OA" address="0x00002788" value="0x00004002" />
+        <register type="OA" address="0x0000278C" value="0x0000D3FF" />
+        <register type="OA" address="0x00002790" value="0x00100700" />
+        <register type="OA" address="0x00002794" value="0x0000FF1F" />
+        <register type="OA" address="0x00002798" value="0x00001402" />
+        <register type="OA" address="0x0000279C" value="0x0000FC3F" />
+        <register type="OA" address="0x000027A0" value="0x00001002" />
+        <register type="OA" address="0x000027A4" value="0x0000FC7F" />
+        <register type="OA" address="0x000027A8" value="0x00000402" />
+        <register type="OA" address="0x000027AC" value="0x0000FD3F" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E758" value="0x00015014" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+        <register type="FLEX" address="0x0000E65C" value="0x00055054" />
+    </register_config>
+  </set>
+
+  <set name="Metric set L3_2"
+       mdapi_supported_apis="VK VK OGL OCL IO BB"
+       underscore_name="l3_2"
+       hw_config_guid="20137ace-b110-4341-883f-1094c820093c"
+       chipset="SKLGT4"
+       symbol_name="L3_2"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SQ is full"
+             description="The percentage of time when SQ is filled above a threshold (usually 48 entries)"
+             data_type="float"
+             max_equation="100"
+             equation="PERFCNT1 READ_REG 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gt_request_queue_full"
+             units="percent"
+             symbol_name="GTRequestQueueFull"
+             availability="true $QueryMode &&"
+             semantic_type="duration"
+             mdapi_supported_apis="VK VK OGL4 OCL"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on the both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 L3 Bank2 Stalled"
+             description="The percentage of time in which slice0 L3 bank2 is stalled"
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l30_bank2_stalled"
+             units="percent"
+             symbol_name="L30Bank2Stalled"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 L3 Bank2 Active"
+             description="The percentage of time in which slice0 L3 bank2 is active"
+             data_type="float"
+             max_equation="100"
+             equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l30_bank2_active"
+             units="percent"
+             symbol_name="L30Bank2Active"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x000091BC" value="0xE0500000" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x126C02E0" />
+        <register type="NOA" address="0x00009888" value="0x146C0001" />
+        <register type="NOA" address="0x00009888" value="0x0A623400" />
+        <register type="NOA" address="0x00009888" value="0x044E8000" />
+        <register type="NOA" address="0x00009888" value="0x064E8000" />
+        <register type="NOA" address="0x00009888" value="0x084E8000" />
+        <register type="NOA" address="0x00009888" value="0x0A4E8000" />
+        <register type="NOA" address="0x00009888" value="0x064F4000" />
+        <register type="NOA" address="0x00009888" value="0x026C3324" />
+        <register type="NOA" address="0x00009888" value="0x046C3422" />
+        <register type="NOA" address="0x00009888" value="0x106C0000" />
+        <register type="NOA" address="0x00009888" value="0x1A6C0000" />
+        <register type="NOA" address="0x00009888" value="0x021BC000" />
+        <register type="NOA" address="0x00009888" value="0x041BC000" />
+        <register type="NOA" address="0x00009888" value="0x141C8000" />
+        <register type="NOA" address="0x00009888" value="0x161C8000" />
+        <register type="NOA" address="0x00009888" value="0x181C8000" />
+        <register type="NOA" address="0x00009888" value="0x1A1C0800" />
+        <register type="NOA" address="0x00009888" value="0x065B4000" />
+        <register type="NOA" address="0x00009888" value="0x1A5C1000" />
+        <register type="NOA" address="0x00009888" value="0x06614000" />
+        <register type="NOA" address="0x00009888" value="0x0C620044" />
+        <register type="NOA" address="0x00009888" value="0x10620000" />
+        <register type="NOA" address="0x00009888" value="0x06620000" />
+        <register type="NOA" address="0x00009888" value="0x084C8000" />
+        <register type="NOA" address="0x00009888" value="0x0A4C002A" />
+        <register type="NOA" address="0x00009888" value="0x020DA000" />
+        <register type="NOA" address="0x00009888" value="0x040DA000" />
+        <register type="NOA" address="0x00009888" value="0x060D2000" />
+        <register type="NOA" address="0x00009888" value="0x0C0F4000" />
+        <register type="NOA" address="0x00009888" value="0x0E0F0055" />
+        <register type="NOA" address="0x00009888" value="0x042C8000" />
+        <register type="NOA" address="0x00009888" value="0x062C8000" />
+        <register type="NOA" address="0x00009888" value="0x082C8000" />
+        <register type="NOA" address="0x00009888" value="0x0A2C8000" />
+        <register type="NOA" address="0x00009888" value="0x0C2CC000" />
+        <register type="NOA" address="0x00009888" value="0x1190F800" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x43900000" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+        <register type="NOA" address="0x00009888" value="0x45900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002744" value="0x00800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+        <register type="OA" address="0x00002770" value="0x00100070" />
+        <register type="OA" address="0x00002774" value="0x0000FFF1" />
+        <register type="OA" address="0x00002778" value="0x00028002" />
+        <register type="OA" address="0x0000277C" value="0x000087FF" />
+        <register type="OA" address="0x00002780" value="0x00020002" />
+        <register type="OA" address="0x00002784" value="0x00008FFF" />
+        <register type="OA" address="0x00002788" value="0x00008002" />
+        <register type="OA" address="0x0000278C" value="0x0000A7FF" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E758" value="0x00015014" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+        <register type="FLEX" address="0x0000E65C" value="0x00055054" />
+    </register_config>
+  </set>
+
+  <set name="Metric set L3_3"
+       mdapi_supported_apis="VK VK OGL OCL IO BB"
+       underscore_name="l3_3"
+       hw_config_guid="d3a6b05e-46ef-44a8-96c3-9bd3e58acbe6"
+       chipset="SKLGT4"
+       symbol_name="L3_3"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SQ is full"
+             description="The percentage of time when SQ is filled above a threshold (usually 48 entries)"
+             data_type="float"
+             max_equation="100"
+             equation="PERFCNT1 READ_REG 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gt_request_queue_full"
+             units="percent"
+             symbol_name="GTRequestQueueFull"
+             availability="true $QueryMode &&"
+             semantic_type="duration"
+             mdapi_supported_apis="VK VK OGL4 OCL"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on the both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Slice0 L3 Bank3 Stalled"
+             description="The percentage of time in which slice0 L3 bank3 is stalled"
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l30_bank3_stalled"
+             units="percent"
+             symbol_name="L30Bank3Stalled"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 L3 Bank3 Active"
+             description="The percentage of time in which slice0 L3 bank3 is active"
+             data_type="float"
+             max_equation="100"
+             equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l30_bank3_active"
+             units="percent"
+             symbol_name="L30Bank3Active"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x000091BC" value="0xE0500000" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x126C4E80" />
+        <register type="NOA" address="0x00009888" value="0x146C0000" />
+        <register type="NOA" address="0x00009888" value="0x0A633400" />
+        <register type="NOA" address="0x00009888" value="0x044E8000" />
+        <register type="NOA" address="0x00009888" value="0x064E8000" />
+        <register type="NOA" address="0x00009888" value="0x084E8000" />
+        <register type="NOA" address="0x00009888" value="0x0A4E8000" />
+        <register type="NOA" address="0x00009888" value="0x0C4E8000" />
+        <register type="NOA" address="0x00009888" value="0x026C3321" />
+        <register type="NOA" address="0x00009888" value="0x046C342F" />
+        <register type="NOA" address="0x00009888" value="0x106C0000" />
+        <register type="NOA" address="0x00009888" value="0x1A6C2000" />
+        <register type="NOA" address="0x00009888" value="0x021BC000" />
+        <register type="NOA" address="0x00009888" value="0x041BC000" />
+        <register type="NOA" address="0x00009888" value="0x061B4000" />
+        <register type="NOA" address="0x00009888" value="0x141C8000" />
+        <register type="NOA" address="0x00009888" value="0x161C8000" />
+        <register type="NOA" address="0x00009888" value="0x181C8000" />
+        <register type="NOA" address="0x00009888" value="0x1A1C1800" />
+        <register type="NOA" address="0x00009888" value="0x06604000" />
+        <register type="NOA" address="0x00009888" value="0x0C630044" />
+        <register type="NOA" address="0x00009888" value="0x10630000" />
+        <register type="NOA" address="0x00009888" value="0x06630000" />
+        <register type="NOA" address="0x00009888" value="0x084C8000" />
+        <register type="NOA" address="0x00009888" value="0x0A4C00AA" />
+        <register type="NOA" address="0x00009888" value="0x020DA000" />
+        <register type="NOA" address="0x00009888" value="0x040DA000" />
+        <register type="NOA" address="0x00009888" value="0x060D2000" />
+        <register type="NOA" address="0x00009888" value="0x0C0F4000" />
+        <register type="NOA" address="0x00009888" value="0x0E0F0055" />
+        <register type="NOA" address="0x00009888" value="0x042C8000" />
+        <register type="NOA" address="0x00009888" value="0x062C8000" />
+        <register type="NOA" address="0x00009888" value="0x082C8000" />
+        <register type="NOA" address="0x00009888" value="0x0A2C8000" />
+        <register type="NOA" address="0x00009888" value="0x0C2C8000" />
+        <register type="NOA" address="0x00009888" value="0x1190F800" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x43900842" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+        <register type="NOA" address="0x00009888" value="0x45900002" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002744" value="0x00800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+        <register type="OA" address="0x00002770" value="0x00100070" />
+        <register type="OA" address="0x00002774" value="0x0000FFF1" />
+        <register type="OA" address="0x00002778" value="0x00028002" />
+        <register type="OA" address="0x0000277C" value="0x000087FF" />
+        <register type="OA" address="0x00002780" value="0x00020002" />
+        <register type="OA" address="0x00002784" value="0x00008FFF" />
+        <register type="OA" address="0x00002788" value="0x00008002" />
+        <register type="OA" address="0x0000278C" value="0x0000A7FF" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E758" value="0x00015014" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+        <register type="FLEX" address="0x0000E65C" value="0x00055054" />
+    </register_config>
+  </set>
+
+  <set name="Metric set RasterizerAndPixelBackend"
+       mdapi_supported_apis="VK VK OGL OCL IO BB"
+       underscore_name="rasterizer_and_pixel_backend"
+       hw_config_guid="4081b948-63f1-4b1a-abaa-6017cb77a63b"
+       chipset="SKLGT4"
+       symbol_name="RasterizerAndPixelBackend"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SQ is full"
+             description="The percentage of time when SQ is filled above a threshold (usually 48 entries)"
+             data_type="float"
+             max_equation="100"
+             equation="PERFCNT1 READ_REG 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gt_request_queue_full"
+             units="percent"
+             symbol_name="GTRequestQueueFull"
+             availability="true $QueryMode &&"
+             semantic_type="duration"
+             mdapi_supported_apis="VK VK OGL4 OCL"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on the both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Slice0 Pixel Values Ready"
+             description="The percentage of time in which slice0 pixel values are ready"
+             data_type="float"
+             max_equation="100"
+             equation="C 6 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="pixel_values0_ready"
+             units="percent"
+             symbol_name="PixelValues0Ready"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/3D Pipe"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="Slice0 Rasterizer Input Available"
+             description="The percentage of time in which slice0 rasterizer input is available"
+             data_type="float"
+             max_equation="100"
+             equation="B 1 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="rasterizer0_input_available"
+             units="percent"
+             symbol_name="Rasterizer0InputAvailable"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Rasterizer"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Slice0 Post-EarlyZ Pixel Data Ready"
+             description="The percentage of time in which slice0 post-EarlyZ pixel data is ready (after early Z tests have been applied)"
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="pixel_data0_ready"
+             units="percent"
+             symbol_name="PixelData0Ready"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Rasterizer/Early Depth Test"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 Rasterizer Output Ready"
+             description="The percentage of time in which slice0 rasterizer output is ready"
+             data_type="float"
+             max_equation="100"
+             equation="C 5 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="rasterizer0_output_ready"
+             units="percent"
+             symbol_name="Rasterizer0OutputReady"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Rasterizer"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="Slice0 PS Output Available"
+             description="The percentage of time in which slice0 PS output is available"
+             data_type="float"
+             max_equation="100"
+             equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_output0_available"
+             units="percent"
+             symbol_name="PSOutput0Available"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/3D Pipe"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x000091BC" value="0xE0500000" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x102F3800" />
+        <register type="NOA" address="0x00009888" value="0x144D0500" />
+        <register type="NOA" address="0x00009888" value="0x120D03C0" />
+        <register type="NOA" address="0x00009888" value="0x140D03CF" />
+        <register type="NOA" address="0x00009888" value="0x0C0F0004" />
+        <register type="NOA" address="0x00009888" value="0x0C4E4000" />
+        <register type="NOA" address="0x00009888" value="0x042F0480" />
+        <register type="NOA" address="0x00009888" value="0x082F0000" />
+        <register type="NOA" address="0x00009888" value="0x022F0000" />
+        <register type="NOA" address="0x00009888" value="0x0A4C0090" />
+        <register type="NOA" address="0x00009888" value="0x064D0027" />
+        <register type="NOA" address="0x00009888" value="0x004D0000" />
+        <register type="NOA" address="0x00009888" value="0x000D0D40" />
+        <register type="NOA" address="0x00009888" value="0x020D803F" />
+        <register type="NOA" address="0x00009888" value="0x040D8023" />
+        <register type="NOA" address="0x00009888" value="0x100D0000" />
+        <register type="NOA" address="0x00009888" value="0x060D2000" />
+        <register type="NOA" address="0x00009888" value="0x020F0010" />
+        <register type="NOA" address="0x00009888" value="0x000F0000" />
+        <register type="NOA" address="0x00009888" value="0x0E0F0050" />
+        <register type="NOA" address="0x00009888" value="0x0A2C8000" />
+        <register type="NOA" address="0x00009888" value="0x0C2C8000" />
+        <register type="NOA" address="0x00009888" value="0x1190FC00" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x41901400" />
+        <register type="NOA" address="0x00009888" value="0x43901485" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+        <register type="NOA" address="0x00009888" value="0x45900001" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002744" value="0x00800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x30800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+        <register type="OA" address="0x00002770" value="0x00000002" />
+        <register type="OA" address="0x00002774" value="0x0000EFFF" />
+        <register type="OA" address="0x00002778" value="0x00006000" />
+        <register type="OA" address="0x0000277C" value="0x0000F3FF" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E758" value="0x00015014" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+        <register type="FLEX" address="0x0000E65C" value="0x00055054" />
+    </register_config>
+  </set>
+
+  <set name="Metric set Sampler"
+       mdapi_supported_apis="VK VK OGL OCL IO BB"
+       underscore_name="sampler"
+       hw_config_guid="eae6bbb1-0e2b-478d-bd9e-f10ded2178f9"
+       chipset="SKLGT4"
+       symbol_name="Sampler"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 Subslice2 Input Available"
+             description="The percentage of time in which slice0 subslice2 sampler input is available"
+             data_type="float"
+             max_equation="100"
+             equation="B 1 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler02_input_available"
+             units="percent"
+             symbol_name="Sampler02InputAvailable"
+             availability="$SubsliceMask 0x4 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SQ is full"
+             description="The percentage of time when SQ is filled above a threshold (usually 48 entries)"
+             data_type="float"
+             max_equation="100"
+             equation="PERFCNT1 READ_REG 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gt_request_queue_full"
+             units="percent"
+             symbol_name="GTRequestQueueFull"
+             availability="true $QueryMode &&"
+             semantic_type="duration"
+             mdapi_supported_apis="VK VK OGL4 OCL"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 Subslice0 Input Available"
+             description="The percentage of time in which slice0 subslice0 sampler input is available"
+             data_type="float"
+             max_equation="100"
+             equation="B 2 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler00_input_available"
+             units="percent"
+             symbol_name="Sampler00InputAvailable"
+             availability="$SubsliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on the both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="Slice0 Subslice2 Sampler Output Ready"
+             description="The percentage of time in which slice0 subslice2 sampler output is ready"
+             data_type="float"
+             max_equation="100"
+             equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler02_output_ready"
+             units="percent"
+             symbol_name="Sampler02OutputReady"
+             availability="$SubsliceMask 0x4 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Slice0 Subslice1 Input Available"
+             description="The percentage of time in which slice0 subslice1 sampler input is available"
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler01_input_available"
+             units="percent"
+             symbol_name="Sampler01InputAvailable"
+             availability="$SubsliceMask 0x2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Slice0 Subslice0 Sampler Output Ready"
+             description="The percentage of time in which slice0 subslice0 sampler output is ready"
+             data_type="float"
+             max_equation="100"
+             equation="C 6 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler00_output_ready"
+             units="percent"
+             symbol_name="Sampler00OutputReady"
+             availability="$SubsliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Slice0 Subslice1 Sampler Output Ready"
+             description="The percentage of time in which slice0 subslice1 sampler output is ready"
+             data_type="float"
+             max_equation="100"
+             equation="C 5 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler01_output_ready"
+             units="percent"
+             symbol_name="Sampler01OutputReady"
+             availability="$SubsliceMask 0x2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x000091BC" value="0xE0500000" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x14152C00" />
+        <register type="NOA" address="0x00009888" value="0x16150005" />
+        <register type="NOA" address="0x00009888" value="0x121600A0" />
+        <register type="NOA" address="0x00009888" value="0x14352C00" />
+        <register type="NOA" address="0x00009888" value="0x16350005" />
+        <register type="NOA" address="0x00009888" value="0x123600A0" />
+        <register type="NOA" address="0x00009888" value="0x14552C00" />
+        <register type="NOA" address="0x00009888" value="0x16550005" />
+        <register type="NOA" address="0x00009888" value="0x125600A0" />
+        <register type="NOA" address="0x00009888" value="0x062F6000" />
+        <register type="NOA" address="0x00009888" value="0x022F2000" />
+        <register type="NOA" address="0x00009888" value="0x0C4C0050" />
+        <register type="NOA" address="0x00009888" value="0x0A4C0010" />
+        <register type="NOA" address="0x00009888" value="0x0C0D8000" />
+        <register type="NOA" address="0x00009888" value="0x0E0DA000" />
+        <register type="NOA" address="0x00009888" value="0x000D8000" />
+        <register type="NOA" address="0x00009888" value="0x020DA000" />
+        <register type="NOA" address="0x00009888" value="0x040DA000" />
+        <register type="NOA" address="0x00009888" value="0x060D2000" />
+        <register type="NOA" address="0x00009888" value="0x100F0350" />
+        <register type="NOA" address="0x00009888" value="0x0C0FB000" />
+        <register type="NOA" address="0x00009888" value="0x0E0F00DA" />
+        <register type="NOA" address="0x00009888" value="0x182C0028" />
+        <register type="NOA" address="0x00009888" value="0x0A2C8000" />
+        <register type="NOA" address="0x00009888" value="0x022DC000" />
+        <register type="NOA" address="0x00009888" value="0x042D4000" />
+        <register type="NOA" address="0x00009888" value="0x0C138000" />
+        <register type="NOA" address="0x00009888" value="0x0E132000" />
+        <register type="NOA" address="0x00009888" value="0x0413C000" />
+        <register type="NOA" address="0x00009888" value="0x1C140018" />
+        <register type="NOA" address="0x00009888" value="0x0C157000" />
+        <register type="NOA" address="0x00009888" value="0x0E150078" />
+        <register type="NOA" address="0x00009888" value="0x10150000" />
+        <register type="NOA" address="0x00009888" value="0x04162180" />
+        <register type="NOA" address="0x00009888" value="0x02160000" />
+        <register type="NOA" address="0x00009888" value="0x04174000" />
+        <register type="NOA" address="0x00009888" value="0x0233A000" />
+        <register type="NOA" address="0x00009888" value="0x04333000" />
+        <register type="NOA" address="0x00009888" value="0x14348000" />
+        <register type="NOA" address="0x00009888" value="0x16348000" />
+        <register type="NOA" address="0x00009888" value="0x02357870" />
+        <register type="NOA" address="0x00009888" value="0x10350000" />
+        <register type="NOA" address="0x00009888" value="0x04360043" />
+        <register type="NOA" address="0x00009888" value="0x02360000" />
+        <register type="NOA" address="0x00009888" value="0x04371000" />
+        <register type="NOA" address="0x00009888" value="0x0E538000" />
+        <register type="NOA" address="0x00009888" value="0x00538000" />
+        <register type="NOA" address="0x00009888" value="0x06533000" />
+        <register type="NOA" address="0x00009888" value="0x1C540020" />
+        <register type="NOA" address="0x00009888" value="0x12548000" />
+        <register type="NOA" address="0x00009888" value="0x0E557000" />
+        <register type="NOA" address="0x00009888" value="0x00557800" />
+        <register type="NOA" address="0x00009888" value="0x10550000" />
+        <register type="NOA" address="0x00009888" value="0x06560043" />
+        <register type="NOA" address="0x00009888" value="0x02560000" />
+        <register type="NOA" address="0x00009888" value="0x06571000" />
+        <register type="NOA" address="0x00009888" value="0x1190FF80" />
+        <register type="NOA" address="0x00009888" value="0x57900000" />
+        <register type="NOA" address="0x00009888" value="0x49900000" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+        <register type="NOA" address="0x00009888" value="0x4B900060" />
+        <register type="NOA" address="0x00009888" value="0x59900000" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x41900C00" />
+        <register type="NOA" address="0x00009888" value="0x43900842" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+        <register type="NOA" address="0x00009888" value="0x45900060" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002744" value="0x00800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x70800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+        <register type="OA" address="0x00002770" value="0x0000C000" />
+        <register type="OA" address="0x00002774" value="0x0000E7FF" />
+        <register type="OA" address="0x00002778" value="0x00003000" />
+        <register type="OA" address="0x0000277C" value="0x0000F9FF" />
+        <register type="OA" address="0x00002780" value="0x00000C00" />
+        <register type="OA" address="0x00002784" value="0x0000FE7F" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E758" value="0x00015014" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+        <register type="FLEX" address="0x0000E65C" value="0x00055054" />
+    </register_config>
+  </set>
+
+  <set name="Metric set TDL_1"
+       mdapi_supported_apis="VK VK OGL OCL IO BB"
+       underscore_name="tdl_1"
+       hw_config_guid="1bba4bd2-81d4-45ec-847f-bc363e17e14d"
+       chipset="SKLGT4"
+       symbol_name="TDL_1"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SQ is full"
+             description="The percentage of time when SQ is filled above a threshold (usually 48 entries)"
+             data_type="float"
+             max_equation="100"
+             equation="PERFCNT1 READ_REG 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gt_request_queue_full"
+             units="percent"
+             symbol_name="GTRequestQueueFull"
+             availability="true $QueryMode &&"
+             semantic_type="duration"
+             mdapi_supported_apis="VK VK OGL4 OCL"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on the both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="NonPS Thread Ready For Dispatch on Slice0 Subslice2"
+             description="The percentage of time in which non-PS thread is ready for dispatch on slice0 subslice2 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="B 4 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="non_ps_thread02_ready_for_dispatch"
+             units="percent"
+             symbol_name="NonPSThread02ReadyForDispatch"
+             availability="$SubsliceMask 0x4 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="NonPS Thread Ready For Dispatch on Slice0 Subslice0"
+             description="The percentage of time in which non-PS thread is ready for dispatch on slice0 subslice0 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="B 2 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="non_ps_thread00_ready_for_dispatch"
+             units="percent"
+             symbol_name="NonPSThread00ReadyForDispatch"
+             availability="$SubsliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Thread Ready For Dispatch on Slice0 Subslice0"
+             description="The percentage of time in which PS thread is ready for dispatch on slice0 subslice0 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="B 1 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_thread00_ready_for_dispatch"
+             units="percent"
+             symbol_name="PSThread00ReadyForDispatch"
+             availability="$SubsliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="PS Thread Ready For Dispatch on Slice0 Subslice1"
+             description="The percentage of time in which PS thread is ready for dispatch on slice0 subslice1 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="B 5 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_thread01_ready_for_dispatch"
+             units="percent"
+             symbol_name="PSThread01ReadyForDispatch"
+             availability="$SubsliceMask 0x2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="PS Thread Ready For Dispatch on Slice0 Subslice2"
+             description="The percentage of time in which PS thread is ready for dispatch on slice0 subslice2 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="B 3 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_thread02_ready_for_dispatch"
+             units="percent"
+             symbol_name="PSThread02ReadyForDispatch"
+             availability="$SubsliceMask 0x4 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <counter name="NonPS Thread Ready For Dispatch on Slice0 Subslice1"
+             description="The percentage of time in which non-PS thread is ready for dispatch on slice0 subslice1 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="non_ps_thread01_ready_for_dispatch"
+             units="percent"
+             symbol_name="NonPSThread01ReadyForDispatch"
+             availability="$SubsliceMask 0x2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x000091BC" value="0xE0500000" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x12120000" />
+        <register type="NOA" address="0x00009888" value="0x12320000" />
+        <register type="NOA" address="0x00009888" value="0x12520000" />
+        <register type="NOA" address="0x00009888" value="0x002F8000" />
+        <register type="NOA" address="0x00009888" value="0x022F3000" />
+        <register type="NOA" address="0x00009888" value="0x0A4C0015" />
+        <register type="NOA" address="0x00009888" value="0x0C0D8000" />
+        <register type="NOA" address="0x00009888" value="0x0E0DA000" />
+        <register type="NOA" address="0x00009888" value="0x000D8000" />
+        <register type="NOA" address="0x00009888" value="0x020DA000" />
+        <register type="NOA" address="0x00009888" value="0x040DA000" />
+        <register type="NOA" address="0x00009888" value="0x060D2000" />
+        <register type="NOA" address="0x00009888" value="0x100F03A0" />
+        <register type="NOA" address="0x00009888" value="0x0C0FF000" />
+        <register type="NOA" address="0x00009888" value="0x0E0F0095" />
+        <register type="NOA" address="0x00009888" value="0x062C8000" />
+        <register type="NOA" address="0x00009888" value="0x082C8000" />
+        <register type="NOA" address="0x00009888" value="0x0A2C8000" />
+        <register type="NOA" address="0x00009888" value="0x0C2D8000" />
+        <register type="NOA" address="0x00009888" value="0x0E2D4000" />
+        <register type="NOA" address="0x00009888" value="0x062D4000" />
+        <register type="NOA" address="0x00009888" value="0x02108000" />
+        <register type="NOA" address="0x00009888" value="0x0410C000" />
+        <register type="NOA" address="0x00009888" value="0x02118000" />
+        <register type="NOA" address="0x00009888" value="0x0411C000" />
+        <register type="NOA" address="0x00009888" value="0x02121880" />
+        <register type="NOA" address="0x00009888" value="0x041219B5" />
+        <register type="NOA" address="0x00009888" value="0x00120000" />
+        <register type="NOA" address="0x00009888" value="0x02134000" />
+        <register type="NOA" address="0x00009888" value="0x04135000" />
+        <register type="NOA" address="0x00009888" value="0x0C308000" />
+        <register type="NOA" address="0x00009888" value="0x0E304000" />
+        <register type="NOA" address="0x00009888" value="0x06304000" />
+        <register type="NOA" address="0x00009888" value="0x0C318000" />
+        <register type="NOA" address="0x00009888" value="0x0E314000" />
+        <register type="NOA" address="0x00009888" value="0x06314000" />
+        <register type="NOA" address="0x00009888" value="0x0C321A80" />
+        <register type="NOA" address="0x00009888" value="0x0E320033" />
+        <register type="NOA" address="0x00009888" value="0x06320031" />
+        <register type="NOA" address="0x00009888" value="0x00320000" />
+        <register type="NOA" address="0x00009888" value="0x0C334000" />
+        <register type="NOA" address="0x00009888" value="0x0E331000" />
+        <register type="NOA" address="0x00009888" value="0x06331000" />
+        <register type="NOA" address="0x00009888" value="0x0E508000" />
+        <register type="NOA" address="0x00009888" value="0x00508000" />
+        <register type="NOA" address="0x00009888" value="0x02504000" />
+        <register type="NOA" address="0x00009888" value="0x0E518000" />
+        <register type="NOA" address="0x00009888" value="0x00518000" />
+        <register type="NOA" address="0x00009888" value="0x02514000" />
+        <register type="NOA" address="0x00009888" value="0x0E521880" />
+        <register type="NOA" address="0x00009888" value="0x00521A80" />
+        <register type="NOA" address="0x00009888" value="0x02520033" />
+        <register type="NOA" address="0x00009888" value="0x0E534000" />
+        <register type="NOA" address="0x00009888" value="0x00534000" />
+        <register type="NOA" address="0x00009888" value="0x02531000" />
+        <register type="NOA" address="0x00009888" value="0x1190FF80" />
+        <register type="NOA" address="0x00009888" value="0x57900000" />
+        <register type="NOA" address="0x00009888" value="0x49900800" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+        <register type="NOA" address="0x00009888" value="0x4B900062" />
+        <register type="NOA" address="0x00009888" value="0x59900000" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x41900C00" />
+        <register type="NOA" address="0x00009888" value="0x43900003" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+        <register type="NOA" address="0x00009888" value="0x45900040" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002744" value="0x00800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x30800000" />
+        <register type="OA" address="0x00002770" value="0x00000002" />
+        <register type="OA" address="0x00002774" value="0x00007FFF" />
+        <register type="OA" address="0x00002778" value="0x00000000" />
+        <register type="OA" address="0x0000277C" value="0x00009FFF" />
+        <register type="OA" address="0x00002780" value="0x00000002" />
+        <register type="OA" address="0x00002784" value="0x0000EFFF" />
+        <register type="OA" address="0x00002788" value="0x00000000" />
+        <register type="OA" address="0x0000278C" value="0x0000F3FF" />
+        <register type="OA" address="0x00002790" value="0x00000002" />
+        <register type="OA" address="0x00002794" value="0x0000FDFF" />
+        <register type="OA" address="0x00002798" value="0x00000000" />
+        <register type="OA" address="0x0000279C" value="0x0000FE7F" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E758" value="0x00015014" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+        <register type="FLEX" address="0x0000E65C" value="0x00055054" />
+    </register_config>
+  </set>
+
+  <set name="Metric set TDL_2"
+       mdapi_supported_apis="VK VK OGL OCL IO BB"
+       underscore_name="tdl_2"
+       hw_config_guid="a4b3106c-cfec-49f5-8e26-470470379e66"
+       chipset="SKLGT4"
+       symbol_name="TDL_2"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SQ is full"
+             description="The percentage of time when SQ is filled above a threshold (usually 48 entries)"
+             data_type="float"
+             max_equation="100"
+             equation="PERFCNT1 READ_REG 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gt_request_queue_full"
+             units="percent"
+             symbol_name="GTRequestQueueFull"
+             availability="true $QueryMode &&"
+             semantic_type="duration"
+             mdapi_supported_apis="VK VK OGL4 OCL"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on the both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Thread Header Ready on Slice0 Subslice1 Port 0"
+             description="The percentage of time in which thread header is ready on slice0 subslice1 thread dispatcher port 0"
+             data_type="float"
+             max_equation="100"
+             equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header01_ready_port0"
+             units="percent"
+             symbol_name="ThreadHeader01ReadyPort0"
+             availability="$SubsliceMask 0x2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Thread Header Ready on Slice0 Subslice1 Port 1"
+             description="The percentage of time in which thread header is ready on slice0 subslice1 thread dispatcher port 1"
+             data_type="float"
+             max_equation="100"
+             equation="C 2 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header01_ready_port1"
+             units="percent"
+             symbol_name="ThreadHeader01ReadyPort1"
+             availability="$SubsliceMask 0x2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Thread Header Ready on Slice0 Subslice2 Port 1"
+             description="The percentage of time in which thread header is ready on slice0 subslice2 thread dispatcher port 1"
+             data_type="float"
+             max_equation="100"
+             equation="C 4 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header02_ready_port1"
+             units="percent"
+             symbol_name="ThreadHeader02ReadyPort1"
+             availability="$SubsliceMask 0x4 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Thread Header Ready on Slice0 Subslice2 Port 0"
+             description="The percentage of time in which thread header is ready on slice0 subslice2 thread dispatcher port 0"
+             data_type="float"
+             max_equation="100"
+             equation="C 3 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header02_ready_port0"
+             units="percent"
+             symbol_name="ThreadHeader02ReadyPort0"
+             availability="$SubsliceMask 0x4 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="VK VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK VK OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="Thread Header Ready on Slice0 Subslice0 Port 0"
+             description="The percentage of time in which thread header is ready on slice0 subslice0 thread dispatcher port 0"
+             data_type="float"
+             max_equation="100"
+             equation="C 5 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header00_ready_port0"
+             units="percent"
+             symbol_name="ThreadHeader00ReadyPort0"
+             availability="$SubsliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="VK VK OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <counter name="Thread Header Ready on Slice0 Subslice0 Port 1"
+             description="The percentage of time in which thread header is ready on slice0 subslice0 thread dispatcher port 1"
+             data_type="float"
+             max_equation="100"
+             equation="C 6 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header00_ready_port1"
+             units="percent"
+             symbol_name="ThreadHeader00ReadyPort1"
+             availability="$SubsliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x000091BC" value="0xE0500000" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x12124D60" />
+        <register type="NOA" address="0x00009888" value="0x12322E60" />
+        <register type="NOA" address="0x00009888" value="0x12524D60" />
+        <register type="NOA" address="0x00009888" value="0x022F3000" />
+        <register type="NOA" address="0x00009888" value="0x0A4C0014" />
+        <register type="NOA" address="0x00009888" value="0x000D8000" />
+        <register type="NOA" address="0x00009888" value="0x020DA000" />
+        <register type="NOA" address="0x00009888" value="0x040DA000" />
+        <register type="NOA" address="0x00009888" value="0x060D2000" />
+        <register type="NOA" address="0x00009888" value="0x0C0FE000" />
+        <register type="NOA" address="0x00009888" value="0x0E0F0097" />
+        <register type="NOA" address="0x00009888" value="0x082C8000" />
+        <register type="NOA" address="0x00009888" value="0x0A2C8000" />
+        <register type="NOA" address="0x00009888" value="0x002D8000" />
+        <register type="NOA" address="0x00009888" value="0x062D4000" />
+        <register type="NOA" address="0x00009888" value="0x0410C000" />
+        <register type="NOA" address="0x00009888" value="0x0411C000" />
+        <register type="NOA" address="0x00009888" value="0x04121FB7" />
+        <register type="NOA" address="0x00009888" value="0x00120000" />
+        <register type="NOA" address="0x00009888" value="0x04135000" />
+        <register type="NOA" address="0x00009888" value="0x00308000" />
+        <register type="NOA" address="0x00009888" value="0x06304000" />
+        <register type="NOA" address="0x00009888" value="0x00318000" />
+        <register type="NOA" address="0x00009888" value="0x06314000" />
+        <register type="NOA" address="0x00009888" value="0x00321B80" />
+        <register type="NOA" address="0x00009888" value="0x0632003F" />
+        <register type="NOA" address="0x00009888" value="0x00334000" />
+        <register type="NOA" address="0x00009888" value="0x06331000" />
+        <register type="NOA" address="0x00009888" value="0x0250C000" />
+        <register type="NOA" address="0x00009888" value="0x0251C000" />
+        <register type="NOA" address="0x00009888" value="0x02521FB7" />
+        <register type="NOA" address="0x00009888" value="0x00520000" />
+        <register type="NOA" address="0x00009888" value="0x02535000" />
+        <register type="NOA" address="0x00009888" value="0x1190FC00" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x41900800" />
+        <register type="NOA" address="0x00009888" value="0x43900063" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+        <register type="NOA" address="0x00009888" value="0x45900040" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002744" value="0x00800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x00800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E758" value="0x00015014" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+        <register type="FLEX" address="0x0000E65C" value="0x00055054" />
+    </register_config>
+  </set>
+
+  <set name="Compute Metrics Extra Gen9"
+       mdapi_supported_apis="VK VK OGL4 OCL IO BB"
+       underscore_name="compute_extra"
+       hw_config_guid="a5aa857d-e8f0-4dfa-8981-ce340fa748fd"
+       chipset="SKLGT4"
+       symbol_name="ComputeExtra"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="fpu1_active"
+             units="percent"
+             symbol_name="Fpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x121203E0" />
+        <register type="NOA" address="0x00009888" value="0x123203E0" />
+        <register type="NOA" address="0x00009888" value="0x125203E0" />
+        <register type="NOA" address="0x00009888" value="0x129203E0" />
+        <register type="NOA" address="0x00009888" value="0x12B203E0" />
+        <register type="NOA" address="0x00009888" value="0x12D203E0" />
+        <register type="NOA" address="0x00009888" value="0x131203E0" />
+        <register type="NOA" address="0x00009888" value="0x133203E0" />
+        <register type="NOA" address="0x00009888" value="0x135203E0" />
+        <register type="NOA" address="0x00009888" value="0x1A4EF000" />
+        <register type="NOA" address="0x00009888" value="0x1C4E0003" />
+        <register type="NOA" address="0x00009888" value="0x024EC000" />
+        <register type="NOA" address="0x00009888" value="0x044EC000" />
+        <register type="NOA" address="0x00009888" value="0x064EC000" />
+        <register type="NOA" address="0x00009888" value="0x022F4000" />
+        <register type="NOA" address="0x00009888" value="0x0C4C02A0" />
+        <register type="NOA" address="0x00009888" value="0x084CA000" />
+        <register type="NOA" address="0x00009888" value="0x0A4C0042" />
+        <register type="NOA" address="0x00009888" value="0x0C0D8000" />
+        <register type="NOA" address="0x00009888" value="0x0E0DA000" />
+        <register type="NOA" address="0x00009888" value="0x000D8000" />
+        <register type="NOA" address="0x00009888" value="0x020DA000" />
+        <register type="NOA" address="0x00009888" value="0x040DA000" />
+        <register type="NOA" address="0x00009888" value="0x060D2000" />
+        <register type="NOA" address="0x00009888" value="0x100F0150" />
+        <register type="NOA" address="0x00009888" value="0x0C0F5000" />
+        <register type="NOA" address="0x00009888" value="0x0E0F006D" />
+        <register type="NOA" address="0x00009888" value="0x182C00A8" />
+        <register type="NOA" address="0x00009888" value="0x022C8000" />
+        <register type="NOA" address="0x00009888" value="0x042C8000" />
+        <register type="NOA" address="0x00009888" value="0x062C8000" />
+        <register type="NOA" address="0x00009888" value="0x0C2C8000" />
+        <register type="NOA" address="0x00009888" value="0x042D8000" />
+        <register type="NOA" address="0x00009888" value="0x06104000" />
+        <register type="NOA" address="0x00009888" value="0x06114000" />
+        <register type="NOA" address="0x00009888" value="0x06120033" />
+        <register type="NOA" address="0x00009888" value="0x00120000" />
+        <register type="NOA" address="0x00009888" value="0x06131000" />
+        <register type="NOA" address="0x00009888" value="0x04308000" />
+        <register type="NOA" address="0x00009888" value="0x04318000" />
+        <register type="NOA" address="0x00009888" value="0x04321980" />
+        <register type="NOA" address="0x00009888" value="0x00320000" />
+        <register type="NOA" address="0x00009888" value="0x04334000" />
+        <register type="NOA" address="0x00009888" value="0x04504000" />
+        <register type="NOA" address="0x00009888" value="0x04514000" />
+        <register type="NOA" address="0x00009888" value="0x04520033" />
+        <register type="NOA" address="0x00009888" value="0x00520000" />
+        <register type="NOA" address="0x00009888" value="0x04531000" />
+        <register type="NOA" address="0x00009888" value="0x1ACEF000" />
+        <register type="NOA" address="0x00009888" value="0x1CCE0003" />
+        <register type="NOA" address="0x00009888" value="0x00AF8000" />
+        <register type="NOA" address="0x00009888" value="0x0CCC02A0" />
+        <register type="NOA" address="0x00009888" value="0x0ACC0001" />
+        <register type="NOA" address="0x00009888" value="0x0C8D8000" />
+        <register type="NOA" address="0x00009888" value="0x0E8DA000" />
+        <register type="NOA" address="0x00009888" value="0x008D8000" />
+        <register type="NOA" address="0x00009888" value="0x028DA000" />
+        <register type="NOA" address="0x00009888" value="0x108F0150" />
+        <register type="NOA" address="0x00009888" value="0x0C8FB000" />
+        <register type="NOA" address="0x00009888" value="0x0E8F0001" />
+        <register type="NOA" address="0x00009888" value="0x18AC00A8" />
+        <register type="NOA" address="0x00009888" value="0x06AC8000" />
+        <register type="NOA" address="0x00009888" value="0x02AD4000" />
+        <register type="NOA" address="0x00009888" value="0x02908000" />
+        <register type="NOA" address="0x00009888" value="0x02918000" />
+        <register type="NOA" address="0x00009888" value="0x02921980" />
+        <register type="NOA" address="0x00009888" value="0x00920000" />
+        <register type="NOA" address="0x00009888" value="0x02934000" />
+        <register type="NOA" address="0x00009888" value="0x02B04000" />
+        <register type="NOA" address="0x00009888" value="0x02B14000" />
+        <register type="NOA" address="0x00009888" value="0x02B20033" />
+        <register type="NOA" address="0x00009888" value="0x00B20000" />
+        <register type="NOA" address="0x00009888" value="0x02B31000" />
+        <register type="NOA" address="0x00009888" value="0x00D08000" />
+        <register type="NOA" address="0x00009888" value="0x00D18000" />
+        <register type="NOA" address="0x00009888" value="0x00D21980" />
+        <register type="NOA" address="0x00009888" value="0x00D34000" />
+        <register type="NOA" address="0x00009888" value="0x072F8000" />
+        <register type="NOA" address="0x00009888" value="0x0D4C0100" />
+        <register type="NOA" address="0x00009888" value="0x0D0D8000" />
+        <register type="NOA" address="0x00009888" value="0x0F0DA000" />
+        <register type="NOA" address="0x00009888" value="0x110F01B0" />
+        <register type="NOA" address="0x00009888" value="0x192C0080" />
+        <register type="NOA" address="0x00009888" value="0x0F2D4000" />
+        <register type="NOA" address="0x00009888" value="0x0F108000" />
+        <register type="NOA" address="0x00009888" value="0x0F118000" />
+        <register type="NOA" address="0x00009888" value="0x0F121980" />
+        <register type="NOA" address="0x00009888" value="0x01120000" />
+        <register type="NOA" address="0x00009888" value="0x0F134000" />
+        <register type="NOA" address="0x00009888" value="0x0F304000" />
+        <register type="NOA" address="0x00009888" value="0x0F314000" />
+        <register type="NOA" address="0x00009888" value="0x0F320033" />
+        <register type="NOA" address="0x00009888" value="0x01320000" />
+        <register type="NOA" address="0x00009888" value="0x0F331000" />
+        <register type="NOA" address="0x00009888" value="0x0D508000" />
+        <register type="NOA" address="0x00009888" value="0x0D518000" />
+        <register type="NOA" address="0x00009888" value="0x0D521980" />
+        <register type="NOA" address="0x00009888" value="0x01520000" />
+        <register type="NOA" address="0x00009888" value="0x0D534000" />
+        <register type="NOA" address="0x00009888" value="0x1190FF80" />
+        <register type="NOA" address="0x00009888" value="0x57900000" />
+        <register type="NOA" address="0x00009888" value="0x49900C00" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+        <register type="NOA" address="0x00009888" value="0x4B900002" />
+        <register type="NOA" address="0x00009888" value="0x59900000" />
+        <register type="NOA" address="0x00009888" value="0x51901100" />
+        <register type="NOA" address="0x00009888" value="0x41901000" />
+        <register type="NOA" address="0x00009888" value="0x43901423" />
+        <register type="NOA" address="0x00009888" value="0x53903331" />
+        <register type="NOA" address="0x00009888" value="0x45900044" />
+    </register_config>
+  </set>
+
+  <set name="Media Vme Pipe Gen9"
+       mdapi_supported_apis="MEDIA IO BB"
+       underscore_name="vme_pipe"
+       hw_config_guid="0e8d8b86-4ee7-4cdd-aaaa-58adc92cb29e"
+       chipset="SKLGT4"
+       symbol_name="VMEPipe"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="EU Thread Occupancy"
+             description="The percentage of time in which hardware threads occupied EUs."
+             data_type="float"
+             max_equation="100"
+             equation="8 A 10 READ FMUL $EuThreadsCount FDIV $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_thread_occupancy"
+             units="percent"
+             symbol_name="EuThreadOccupancy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VME Busy"
+             description="The percentage of time in which VME (IME or CRE) was actively processing data."
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ B 3 READ FADD 2 FDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vme_busy"
+             units="percent"
+             symbol_name="VMEBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Overview System Batch Tier2"
+             mdapi_group="VME Pipe"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x141A5800" />
+        <register type="NOA" address="0x00009888" value="0x161A00C0" />
+        <register type="NOA" address="0x00009888" value="0x12180240" />
+        <register type="NOA" address="0x00009888" value="0x14180002" />
+        <register type="NOA" address="0x00009888" value="0x149A5800" />
+        <register type="NOA" address="0x00009888" value="0x169A00C0" />
+        <register type="NOA" address="0x00009888" value="0x12980240" />
+        <register type="NOA" address="0x00009888" value="0x14980002" />
+        <register type="NOA" address="0x00009888" value="0x1A4E3FC0" />
+        <register type="NOA" address="0x00009888" value="0x002F1000" />
+        <register type="NOA" address="0x00009888" value="0x022F8000" />
+        <register type="NOA" address="0x00009888" value="0x042F3000" />
+        <register type="NOA" address="0x00009888" value="0x004C4000" />
+        <register type="NOA" address="0x00009888" value="0x0A4C9500" />
+        <register type="NOA" address="0x00009888" value="0x0C4C002A" />
+        <register type="NOA" address="0x00009888" value="0x000D2000" />
+        <register type="NOA" address="0x00009888" value="0x060D8000" />
+        <register type="NOA" address="0x00009888" value="0x080DA000" />
+        <register type="NOA" address="0x00009888" value="0x0A0DA000" />
+        <register type="NOA" address="0x00009888" value="0x0C0DA000" />
+        <register type="NOA" address="0x00009888" value="0x0C0F0400" />
+        <register type="NOA" address="0x00009888" value="0x0E0F5500" />
+        <register type="NOA" address="0x00009888" value="0x100F0015" />
+        <register type="NOA" address="0x00009888" value="0x002C8000" />
+        <register type="NOA" address="0x00009888" value="0x0E2C8000" />
+        <register type="NOA" address="0x00009888" value="0x162CAA00" />
+        <register type="NOA" address="0x00009888" value="0x182C000A" />
+        <register type="NOA" address="0x00009888" value="0x04193000" />
+        <register type="NOA" address="0x00009888" value="0x081A28C1" />
+        <register type="NOA" address="0x00009888" value="0x001A0000" />
+        <register type="NOA" address="0x00009888" value="0x00133000" />
+        <register type="NOA" address="0x00009888" value="0x0613C000" />
+        <register type="NOA" address="0x00009888" value="0x0813F000" />
+        <register type="NOA" address="0x00009888" value="0x00172000" />
+        <register type="NOA" address="0x00009888" value="0x06178000" />
+        <register type="NOA" address="0x00009888" value="0x0817A000" />
+        <register type="NOA" address="0x00009888" value="0x00180037" />
+        <register type="NOA" address="0x00009888" value="0x06180940" />
+        <register type="NOA" address="0x00009888" value="0x08180000" />
+        <register type="NOA" address="0x00009888" value="0x02180000" />
+        <register type="NOA" address="0x00009888" value="0x04183000" />
+        <register type="NOA" address="0x00009888" value="0x04AFC000" />
+        <register type="NOA" address="0x00009888" value="0x06AF3000" />
+        <register type="NOA" address="0x00009888" value="0x0ACC4000" />
+        <register type="NOA" address="0x00009888" value="0x0CCC0015" />
+        <register type="NOA" address="0x00009888" value="0x0A8DA000" />
+        <register type="NOA" address="0x00009888" value="0x0C8DA000" />
+        <register type="NOA" address="0x00009888" value="0x0E8F4000" />
+        <register type="NOA" address="0x00009888" value="0x108F0015" />
+        <register type="NOA" address="0x00009888" value="0x16ACA000" />
+        <register type="NOA" address="0x00009888" value="0x18AC000A" />
+        <register type="NOA" address="0x00009888" value="0x06993000" />
+        <register type="NOA" address="0x00009888" value="0x0C9A28C1" />
+        <register type="NOA" address="0x00009888" value="0x009A0000" />
+        <register type="NOA" address="0x00009888" value="0x0A93F000" />
+        <register type="NOA" address="0x00009888" value="0x0C93F000" />
+        <register type="NOA" address="0x00009888" value="0x0A97A000" />
+        <register type="NOA" address="0x00009888" value="0x0C97A000" />
+        <register type="NOA" address="0x00009888" value="0x0A980977" />
+        <register type="NOA" address="0x00009888" value="0x08980000" />
+        <register type="NOA" address="0x00009888" value="0x04980000" />
+        <register type="NOA" address="0x00009888" value="0x06983000" />
+        <register type="NOA" address="0x00009888" value="0x119000FF" />
+        <register type="NOA" address="0x00009888" value="0x51900010" />
+        <register type="NOA" address="0x00009888" value="0x41900060" />
+        <register type="NOA" address="0x00009888" value="0x55900111" />
+        <register type="NOA" address="0x00009888" value="0x45900C00" />
+        <register type="NOA" address="0x00009888" value="0x47900821" />
+        <register type="NOA" address="0x00009888" value="0x57900000" />
+        <register type="NOA" address="0x00009888" value="0x49900002" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x30800000" />
+        <register type="OA" address="0x00002770" value="0x00100030" />
+        <register type="OA" address="0x00002774" value="0x0000FFF9" />
+        <register type="OA" address="0x00002778" value="0x00000002" />
+        <register type="OA" address="0x0000277C" value="0x0000FFFC" />
+        <register type="OA" address="0x00002780" value="0x00000002" />
+        <register type="OA" address="0x00002784" value="0x0000FFF3" />
+        <register type="OA" address="0x00002788" value="0x00100180" />
+        <register type="OA" address="0x0000278C" value="0x0000FFCF" />
+        <register type="OA" address="0x00002790" value="0x00000002" />
+        <register type="OA" address="0x00002794" value="0x0000FFCF" />
+        <register type="OA" address="0x00002798" value="0x00000002" />
+        <register type="OA" address="0x0000279C" value="0x0000FF3F" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00008003" />
+    </register_config>
+  </set>
+
+  <set name="Gpu Rings Busyness"
+       mdapi_supported_apis="VK VK OGL OCL MEDIA IO BB"
+       underscore_name="gpu_busyness"
+       hw_config_guid="4e5b1599-5b01-4b3d-89fa-6b26a25fe02b"
+       chipset="SKLGT4"
+       symbol_name="GpuBusyness"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="Vebox Ring Busy"
+             description="The percentage of time when vebox command streamer was busy."
+             data_type="float"
+             max_equation="100"
+             equation="C 4 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vebox_busy"
+             units="percent"
+             symbol_name="VeboxBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="System Frame Batch"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Render Ring Busy"
+             description="The percentage of time when render command streamer was busy."
+             data_type="float"
+             max_equation="100"
+             equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="render_busy"
+             units="percent"
+             symbol_name="RenderBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="System Frame Batch"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Vdbox0 Ring Busy"
+             description="The percentage of time when Vdbox0 command streamer was busy."
+             data_type="float"
+             max_equation="100"
+             equation="C 6 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vdbox0_busy"
+             units="percent"
+             symbol_name="Vdbox0Busy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="System Frame Batch"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Blitter Ring Busy"
+             description="The percentage of time when blitter command streamer was busy."
+             data_type="float"
+             max_equation="100"
+             equation="C 3 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="blitter_busy"
+             units="percent"
+             symbol_name="BlitterBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="System Frame Batch"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="AnyRingBusy"
+             description="The percentage of time when any command streamer was busy."
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="any_ring_busy"
+             units="percent"
+             symbol_name="AnyRingBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Vdbox1 Ring Busy"
+             description="The percentage of time when Vdbox1 command streamer was busy."
+             data_type="float"
+             max_equation="100"
+             equation="C 5 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vdbox1_busy"
+             units="percent"
+             symbol_name="Vdbox1Busy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="System Frame Batch"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x21D05800" />
+        <register type="NOA" address="0x00009888" value="0x13805800" />
+        <register type="NOA" address="0x00009888" value="0x05962C25" />
+        <register type="NOA" address="0x00009888" value="0x19950016" />
+        <register type="NOA" address="0x00009888" value="0x21C05800" />
+        <register type="NOA" address="0x00009888" value="0x09D000A5" />
+        <register type="NOA" address="0x00009888" value="0x11D00000" />
+        <register type="NOA" address="0x00009888" value="0x05D00000" />
+        <register type="NOA" address="0x00009888" value="0x09D54000" />
+        <register type="NOA" address="0x00009888" value="0x07800035" />
+        <register type="NOA" address="0x00009888" value="0x11800000" />
+        <register type="NOA" address="0x00009888" value="0x1D810400" />
+        <register type="NOA" address="0x00009888" value="0x21960000" />
+        <register type="NOA" address="0x00009888" value="0x0996C000" />
+        <register type="NOA" address="0x00009888" value="0x0B964000" />
+        <register type="NOA" address="0x00009888" value="0x19938000" />
+        <register type="NOA" address="0x00009888" value="0x1B930068" />
+        <register type="NOA" address="0x00009888" value="0x15948000" />
+        <register type="NOA" address="0x00009888" value="0x1B94000C" />
+        <register type="NOA" address="0x00009888" value="0x03957500" />
+        <register type="NOA" address="0x00009888" value="0x1D950000" />
+        <register type="NOA" address="0x00009888" value="0x17950000" />
+        <register type="NOA" address="0x00009888" value="0x07E54000" />
+        <register type="NOA" address="0x00009888" value="0x07928000" />
+        <register type="NOA" address="0x00009888" value="0x03988000" />
+        <register type="NOA" address="0x00009888" value="0x17908000" />
+        <register type="NOA" address="0x00009888" value="0x19904000" />
+        <register type="NOA" address="0x00009888" value="0x1B908000" />
+        <register type="NOA" address="0x00009888" value="0x1D908000" />
+        <register type="NOA" address="0x00009888" value="0x1F908000" />
+        <register type="NOA" address="0x00009888" value="0x09978000" />
+        <register type="NOA" address="0x00009888" value="0x0BC000A5" />
+        <register type="NOA" address="0x00009888" value="0x11C00000" />
+        <register type="NOA" address="0x00009888" value="0x05C00000" />
+        <register type="NOA" address="0x00009888" value="0x0BC54000" />
+        <register type="NOA" address="0x00009888" value="0x11900000" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x43900463" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+        <register type="NOA" address="0x00009888" value="0x45900040" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x10800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+        <register type="OA" address="0x00002770" value="0x0007C000" />
+        <register type="OA" address="0x00002774" value="0x000007FF" />
+    </register_config>
+  </set>
+
+  <set name="MDAPI testing set Gen9"
+       mdapi_supported_apis="VK VK OGL OCL IO BB"
+       underscore_name="test_oa"
+       hw_config_guid="882fa433-1f4a-4a67-a962-c741888fe5f5"
+       chipset="SKLGT4"
+       symbol_name="TestOa"
+       >
+    <counter name="TestCounter7"
+             description="HW test counter 7. Factor: 0.666"
+             data_type="uint64"
+             equation="B 7 READ"
+             underscore_name="counter7"
+             units="events"
+             symbol_name="Counter7"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="TestCounter8"
+             description="HW test counter 8. Should be equal to 1."
+             data_type="uint64"
+             equation="C 7 READ"
+             underscore_name="counter8"
+             units="events"
+             symbol_name="Counter8"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="TestCounter4"
+             description="HW test counter 4. Factor: 0.333"
+             data_type="uint64"
+             equation="B 4 READ"
+             underscore_name="counter4"
+             units="events"
+             symbol_name="Counter4"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="TestCounter5"
+             description="HW test counter 5. Factor: 0.333"
+             data_type="uint64"
+             equation="B 5 READ"
+             underscore_name="counter5"
+             units="events"
+             symbol_name="Counter5"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="TestCounter6"
+             description="HW test counter 6. Factor: 0.166"
+             data_type="uint64"
+             equation="B 6 READ"
+             underscore_name="counter6"
+             units="events"
+             symbol_name="Counter6"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="TestCounter3"
+             description="HW test counter 3. Factor: 0.5"
+             data_type="uint64"
+             equation="B 3 READ"
+             underscore_name="counter3"
+             units="events"
+             symbol_name="Counter3"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="TestCounter0"
+             description="HW test counter 0. Factor: 0.0"
+             data_type="uint64"
+             equation="B 0 READ"
+             underscore_name="counter0"
+             units="events"
+             symbol_name="Counter0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="TestCounter1"
+             description="HW test counter 1. Factor: 1.0"
+             data_type="uint64"
+             equation="B 1 READ"
+             underscore_name="counter1"
+             units="events"
+             symbol_name="Counter1"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="TestCounter2"
+             description="HW test counter 2. Factor: 1.0"
+             data_type="uint64"
+             equation="B 2 READ"
+             underscore_name="counter2"
+             units="events"
+             symbol_name="Counter2"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x11810000" />
+        <register type="NOA" address="0x00009888" value="0x07810013" />
+        <register type="NOA" address="0x00009888" value="0x1F810000" />
+        <register type="NOA" address="0x00009888" value="0x1D810000" />
+        <register type="NOA" address="0x00009888" value="0x1B930040" />
+        <register type="NOA" address="0x00009888" value="0x07E54000" />
+        <register type="NOA" address="0x00009888" value="0x1F908000" />
+        <register type="NOA" address="0x00009888" value="0x11900000" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+        <register type="NOA" address="0x00009888" value="0x45900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002744" value="0x00800000" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002770" value="0x00000004" />
+        <register type="OA" address="0x00002774" value="0x00000000" />
+        <register type="OA" address="0x00002778" value="0x00000003" />
+        <register type="OA" address="0x0000277C" value="0x00000000" />
+        <register type="OA" address="0x00002780" value="0x00000007" />
+        <register type="OA" address="0x00002784" value="0x00000000" />
+        <register type="OA" address="0x00002788" value="0x00100002" />
+        <register type="OA" address="0x0000278C" value="0x0000FFF7" />
+        <register type="OA" address="0x00002790" value="0x00100002" />
+        <register type="OA" address="0x00002794" value="0x0000FFCF" />
+        <register type="OA" address="0x00002798" value="0x00100082" />
+        <register type="OA" address="0x0000279C" value="0x0000FFEF" />
+        <register type="OA" address="0x000027A0" value="0x001000C2" />
+        <register type="OA" address="0x000027A4" value="0x0000FFE7" />
+        <register type="OA" address="0x000027A8" value="0x00100001" />
+        <register type="OA" address="0x000027AC" value="0x0000FFE7" />
+    </register_config>
+  </set>
+
+  <set name="Metric set PMA Stall"
+       mdapi_supported_apis="VK VK OGL OGL4 OCL IO MEDIA"
+       underscore_name="pma__stall"
+       hw_config_guid="befe9fd6-474e-4a3d-b98e-cd793715cf91"
+       chipset="SKLGT4"
+       symbol_name="PMA_Stall"
+       >
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="STC PMA stall"
+             description="Percentage of time when stencil cache line and an overlapping pixel are causing stalls"
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ B 1 READ FADD 2 FDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="stc_pma_stall"
+             units="percent"
+             symbol_name="StcPMAStall"
+             availability="$SliceMask 1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_group="GPU/Stencil Cache"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x122D3080" />
+        <register type="NOA" address="0x00009888" value="0x000D2000" />
+        <register type="NOA" address="0x00009888" value="0x060D8000" />
+        <register type="NOA" address="0x00009888" value="0x080DA000" />
+        <register type="NOA" address="0x00009888" value="0x0A0DA000" />
+        <register type="NOA" address="0x00009888" value="0x0C0F0800" />
+        <register type="NOA" address="0x00009888" value="0x0E0FAA00" />
+        <register type="NOA" address="0x00009888" value="0x100F0002" />
+        <register type="NOA" address="0x00009888" value="0x002D0025" />
+        <register type="NOA" address="0x00009888" value="0x062D1300" />
+        <register type="NOA" address="0x00009888" value="0x082D16A4" />
+        <register type="NOA" address="0x00009888" value="0x0A2D162E" />
+        <register type="NOA" address="0x00009888" value="0x102D0000" />
+        <register type="NOA" address="0x00009888" value="0x1190003F" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x41900000" />
+        <register type="NOA" address="0x00009888" value="0x55900000" />
+        <register type="NOA" address="0x00009888" value="0x45900000" />
+        <register type="NOA" address="0x00009888" value="0x47900000" />
+        <register type="NOA" address="0x00009888" value="0x57900000" />
+        <register type="NOA" address="0x00009888" value="0x49900000" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x30800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+        <register type="OA" address="0x00002770" value="0x00E00021" />
+        <register type="OA" address="0x00002774" value="0x0007FFF8" />
+        <register type="OA" address="0x00002778" value="0x07000101" />
+        <register type="OA" address="0x0000277C" value="0x0038FFC7" />
+    </register_config>
+  </set>
+
+</metrics>
diff --git a/lib/i915/perf-configs/oa-tgl.xml b/lib/i915/perf-configs/oa-tgl.xml
new file mode 100644
index 00000000..095d9229
--- /dev/null
+++ b/lib/i915/perf-configs/oa-tgl.xml
@@ -0,0 +1,8491 @@
+<?xml version="1.0"?>
+<metrics version="1581936326" merge_md5="">
+  <set name="Render Metrics Basic Gen12"
+       mdapi_supported_apis="VK OGL OCL IO"
+       underscore_name="render_basic"
+       hw_config_guid="daf004fb-fc9f-45e0-b842-1770e6d273c2"
+       chipset="TGL"
+       symbol_name="RenderBasic"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS EM Pipe Active"
+             description="The percentage of time in which EU EM pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_em_active"
+             units="percent"
+             symbol_name="VsEmActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were actively processed on both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Samplers Busy"
+             description="The percentage of time in which samplers have been processing EU requests."
+             data_type="float"
+             max_equation="100"
+             equation="C 7 READ GPU_CLOCK 0 READ FDIV"
+             underscore_name="samplers_busy"
+             units="percent"
+             symbol_name="SamplersBusy"
+             availability="$DualSubsliceMask 1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="Sampler"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="PS EM Pipe Active"
+             description="The percentage of time in which EU EM pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_em_active"
+             units="percent"
+             symbol_name="PsEmActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="PS FPU Pipe Active"
+             description="The percentage of time in which EU FPU pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu_active"
+             units="percent"
+             symbol_name="PsFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU Pipe Active"
+             description="The percentage of time in which EU FPU pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu_active"
+             units="percent"
+             symbol_name="VsFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texel lookups (with 2x2 accuracy) that missed the L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO MEDIA"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL OCL IO"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GTI Read Throughput"
+             description="The total number of GPU memory bytes read from GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL"
+             equation="64  C 5 READ C 4 READ UADD C 3 READ UADD C 2 READ UADD UMUL"
+             underscore_name="gti_read_throughput"
+             units="bytes"
+             symbol_name="GtiReadThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="IO"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="EU FPU And EM Pipes Active"
+             description="The percentage of time in which EU FPU and EM pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_em_active"
+             units="percent"
+             symbol_name="EuFpuEmActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samplers Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which samplers have been slowing down the pipe when processing EU requests."
+             data_type="float"
+             high_watermark="15"
+             equation="C 6 READ GPU_CLOCK 0 READ FDIV"
+             max_equation="100"
+             underscore_name="sampler_bottleneck"
+             units="percent"
+             symbol_name="SamplerBottleneck"
+             availability="$DualSubsliceMask 1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Indicate System Frame Batch Draw"
+             mdapi_group="Sampler"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="GTI Write Throughput"
+             description="The total number of GPU memory bytes written to GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL"
+             equation="64  C 1 READ C 0 READ UADD UMUL"
+             underscore_name="gti_write_throughput"
+             units="bytes"
+             symbol_name="GtiWriteThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="IO"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ A 31 READ UADD A 32 READ UADD 64 UMUL"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL OCL IO"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL OCL IO"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00000D04" value="0x00000200" />
+        <register type="NOA" address="0x00009840" value="0x00000000" />
+        <register type="NOA" address="0x00009884" value="0x00000000" />
+        <register type="NOA" address="0x00009888" value="0x14150001" />
+        <register type="NOA" address="0x00009888" value="0x0A124000" />
+        <register type="NOA" address="0x00009888" value="0x0C124000" />
+        <register type="NOA" address="0x00009888" value="0x1A138000" />
+        <register type="NOA" address="0x00009888" value="0x1C130100" />
+        <register type="NOA" address="0x00009888" value="0x04155100" />
+        <register type="NOA" address="0x00009888" value="0x06150050" />
+        <register type="NOA" address="0x00009888" value="0x10150000" />
+        <register type="NOA" address="0x00009888" value="0x1A150000" />
+        <register type="NOA" address="0x00009888" value="0x34001000" />
+        <register type="NOA" address="0x00009888" value="0x36000002" />
+        <register type="NOA" address="0x00009888" value="0x2205A000" />
+        <register type="NOA" address="0x00009884" value="0x00000003" />
+        <register type="NOA" address="0x00009888" value="0x05151D47" />
+        <register type="NOA" address="0x00009888" value="0x09151536" />
+        <register type="NOA" address="0x00009888" value="0x05351C00" />
+        <register type="NOA" address="0x00009888" value="0x09351400" />
+        <register type="NOA" address="0x00009888" value="0x5D102C00" />
+        <register type="NOA" address="0x00009888" value="0x5B1005BB" />
+        <register type="NOA" address="0x00009888" value="0x1B141800" />
+        <register type="NOA" address="0x00009888" value="0x5F110500" />
+        <register type="NOA" address="0x00009888" value="0x0B128000" />
+        <register type="NOA" address="0x00009888" value="0x0D128000" />
+        <register type="NOA" address="0x00009888" value="0x1F150137" />
+        <register type="NOA" address="0x00009888" value="0x01150000" />
+        <register type="NOA" address="0x00009888" value="0x0F168000" />
+        <register type="NOA" address="0x00009888" value="0x03164000" />
+        <register type="NOA" address="0x00009888" value="0x05164000" />
+        <register type="NOA" address="0x00009888" value="0x1D350137" />
+        <register type="NOA" address="0x00009888" value="0x03350147" />
+        <register type="NOA" address="0x00009888" value="0x07350136" />
+        <register type="NOA" address="0x00009888" value="0x01350000" />
+        <register type="NOA" address="0x00009888" value="0x0F364000" />
+        <register type="NOA" address="0x00009888" value="0x01368000" />
+        <register type="NOA" address="0x00009888" value="0x03368000" />
+        <register type="NOA" address="0x00009888" value="0x17100000" />
+        <register type="NOA" address="0x00009888" value="0x55103130" />
+        <register type="NOA" address="0x00009888" value="0x57100001" />
+        <register type="NOA" address="0x00009888" value="0x47103000" />
+        <register type="NOA" address="0x00009888" value="0x49103131" />
+        <register type="NOA" address="0x00009888" value="0x4B100131" />
+        <register type="NOA" address="0x00009888" value="0x4D100000" />
+        <register type="NOA" address="0x00009888" value="0x31100000" />
+        <register type="NOA" address="0x00009884" value="0x00000003" />
+        <register type="NOA" address="0x00009888" value="0x65100002" />
+        <register type="NOA" address="0x00009884" value="0x00000000" />
+        <register type="NOA" address="0x00009888" value="0x42000001" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x0000D920" value="0x00000000" />
+        <register type="OA" address="0x0000D900" value="0x00000000" />
+        <register type="OA" address="0x0000D904" value="0x00800000" />
+        <register type="OA" address="0x0000D910" value="0x00000000" />
+        <register type="OA" address="0x0000D914" value="0x00800000" />
+        <register type="OA" address="0x0000DC40" value="0x00000000" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+        <register type="FLEX" address="0x0000E65C" value="0xFFFFFFFF" />
+    </register_config>
+  </set>
+
+  <set name="Compute Metrics Basic"
+       mdapi_supported_apis="VK OGL OCL IO"
+       underscore_name="compute_basic"
+       hw_config_guid="6ad92fc0-ed62-460c-b774-5353534c67ed"
+       chipset="TGL"
+       symbol_name="ComputeBasic"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU AVG IPC Rate"
+             description="The average rate of IPC calculated for 2 FPU pipelines."
+             data_type="float"
+             max_equation="2"
+             equation="A 9 READ A 10 READ A 11 READ FADD A 9 READ FSUB FDIV 1 FADD"
+             underscore_name="eu_avg_ipc_rate"
+             units="number"
+             symbol_name="EuAvgIpcRate"
+             semantic_type="ratio"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO MEDIA"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EM Pipe Active"
+             description="The percentage of time in which EU EM pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="em_active"
+             units="percent"
+             symbol_name="EmActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texel lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="EU FPU Pipe Active"
+             description="The percentage of time in which EU FPU pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="fpu_active"
+             units="percent"
+             symbol_name="FpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL OCL IO"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GTI Read Throughput"
+             description="The total number of GPU memory bytes read from GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL"
+             equation="64  C 7 READ C 6 READ UADD C 5 READ UADD C 4 READ UADD UMUL"
+             underscore_name="gti_read_throughput"
+             units="bytes"
+             symbol_name="GtiReadThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="IO"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="EU FPU And EM Pipes Active"
+             description="The percentage of time in which EU FPU and EM pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_em_active"
+             units="percent"
+             symbol_name="EuFpuEmActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="EU Thread Occupancy"
+             description="The percentage of time in which hardware threads occupied EUs."
+             data_type="float"
+             max_equation="100"
+             equation="8 A 13 READ FMUL $EuThreadsCount FDIV $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_thread_occupancy"
+             units="percent"
+             symbol_name="EuThreadOccupancy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="GTI Write Throughput"
+             description="The total number of GPU memory bytes written to GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL"
+             equation="64  C 3 READ C 2 READ UADD UMUL"
+             underscore_name="gti_write_throughput"
+             units="bytes"
+             symbol_name="GtiWriteThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="IO"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ A 31 READ UADD A 32 READ UADD 64 UMUL"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL OCL IO"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL OCL IO"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <counter name="EU Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_send_active"
+             units="percent"
+             symbol_name="EuSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00000D04" value="0x00000200" />
+        <register type="NOA" address="0x00009840" value="0x00000000" />
+        <register type="NOA" address="0x00009884" value="0x00000003" />
+        <register type="NOA" address="0x00009888" value="0x05151D37" />
+        <register type="NOA" address="0x00009888" value="0x09151547" />
+        <register type="NOA" address="0x00009888" value="0x05351C00" />
+        <register type="NOA" address="0x00009888" value="0x09351400" />
+        <register type="NOA" address="0x00009888" value="0x5B100BBB" />
+        <register type="NOA" address="0x00009888" value="0x0D150136" />
+        <register type="NOA" address="0x00009888" value="0x01150000" />
+        <register type="NOA" address="0x00009888" value="0x03164000" />
+        <register type="NOA" address="0x00009888" value="0x05164000" />
+        <register type="NOA" address="0x00009888" value="0x07164000" />
+        <register type="NOA" address="0x00009888" value="0x03350137" />
+        <register type="NOA" address="0x00009888" value="0x07350147" />
+        <register type="NOA" address="0x00009888" value="0x0B350136" />
+        <register type="NOA" address="0x00009888" value="0x01350000" />
+        <register type="NOA" address="0x00009888" value="0x01368000" />
+        <register type="NOA" address="0x00009888" value="0x03368000" />
+        <register type="NOA" address="0x00009888" value="0x05368000" />
+        <register type="NOA" address="0x00009888" value="0x17100000" />
+        <register type="NOA" address="0x00009888" value="0x47100000" />
+        <register type="NOA" address="0x00009888" value="0x49100000" />
+        <register type="NOA" address="0x00009888" value="0x4B100000" />
+        <register type="NOA" address="0x00009888" value="0x4D100000" />
+        <register type="NOA" address="0x00009888" value="0x31100000" />
+        <register type="NOA" address="0x00009884" value="0x00000003" />
+        <register type="NOA" address="0x00009888" value="0x65100002" />
+        <register type="NOA" address="0x00009884" value="0x00000000" />
+        <register type="NOA" address="0x00009888" value="0x42000001" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x0000D920" value="0x00000000" />
+        <register type="OA" address="0x0000D900" value="0x00000000" />
+        <register type="OA" address="0x0000D904" value="0x00800000" />
+        <register type="OA" address="0x0000D910" value="0x00000000" />
+        <register type="OA" address="0x0000D914" value="0x00800000" />
+        <register type="OA" address="0x0000DC40" value="0x00000000" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00000003" />
+        <register type="FLEX" address="0x0000E658" value="0x00002001" />
+        <register type="FLEX" address="0x0000E758" value="0x00000008" />
+        <register type="FLEX" address="0x0000E65C" value="0xFFFFFFFF" />
+    </register_config>
+  </set>
+
+  <set name="Render Metrics for 3D Pipeline Profile"
+       mdapi_supported_apis="VK OGL OCL IO"
+       underscore_name="render_pipe_profile"
+       hw_config_guid="77ae98cf-9a9e-4e35-be85-597b09ffbe53"
+       chipset="TGL"
+       symbol_name="RenderPipeProfile"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Bottleneck"
+             low_watermark="10"
+             description="The percentage of time in which vertex shader pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="30"
+             equation="C 6 READ 100 UMUL $GpuCoreClocks FDIV"
+             max_equation="100"
+             underscore_name="vs_bottleneck"
+             units="percent"
+             symbol_name="VsBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Hi-Depth Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which early hierarchical depth test pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="15"
+             equation="B 3 READ 100 UMUL $GpuCoreClocks FDIV"
+             max_equation="100"
+             underscore_name="hi_depth_bottleneck"
+             units="percent"
+             symbol_name="HiDepthBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which geometry shader pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="15"
+             equation="B 4 READ 100 UMUL $GpuCoreClocks FDIV"
+             max_equation="100"
+             underscore_name="gs_bottleneck"
+             units="percent"
+             symbol_name="GsBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Geometry Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="BC Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which barycentric coordinates calculation pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="15"
+             equation="C 1 READ 100 UMUL $GpuCoreClocks FDIV"
+             max_equation="100"
+             underscore_name="bc_bottleneck"
+             units="percent"
+             symbol_name="BcBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Rasterizer/Barycentric Calc"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="HS Stall"
+             description="The percentage of time in which hull shader pipeline stage was stalled."
+             data_type="float"
+             max_equation="100"
+             equation="B 2 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="hs_stall"
+             units="percent"
+             symbol_name="HsStall"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO"
+             mdapi_usage_flags="Tier4 Correlate Draw"
+             mdapi_group="3D Pipe/Hull Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texel lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO MEDIA"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="VF Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which vertex fetch pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="15"
+             equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             max_equation="100"
+             underscore_name="vf_bottleneck"
+             units="percent"
+             symbol_name="VfBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Input Assembler"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL OCL IO"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Strip-Fans Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which strip-fans pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="10"
+             equation="C 2 READ 100 UMUL $GpuCoreClocks FDIV"
+             max_equation="100"
+             underscore_name="sf_bottleneck"
+             units="percent"
+             symbol_name="SfBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Rasterizer/Strip-Fans"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SF Stall"
+             description="The percentage of time in which strip-fans pipeline stage was stalled."
+             data_type="float"
+             max_equation="100"
+             equation="B 6 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sf_stall"
+             units="percent"
+             symbol_name="SfStall"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO"
+             mdapi_usage_flags="Tier4 Correlate Draw"
+             mdapi_group="3D Pipe/Rasterizer/Strip-Fans"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="HS Bottleneck"
+             low_watermark="3"
+             description="The percentage of time in which hull shader pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="9"
+             equation="B 5 READ 100 UMUL $GpuCoreClocks FDIV"
+             max_equation="100"
+             underscore_name="hs_bottleneck"
+             units="percent"
+             symbol_name="HsBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Hull Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="CL Stall"
+             description="The percentage of time in which clipper pipeline stage was stalled."
+             data_type="float"
+             max_equation="100"
+             equation="B 1 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="cl_stall"
+             units="percent"
+             symbol_name="ClStall"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO"
+             mdapi_usage_flags="Tier4 Correlate Draw"
+             mdapi_group="3D Pipe/Clipper"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SO Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which stream output pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="15"
+             equation="C 4 READ 100 UMUL $GpuCoreClocks FDIV"
+             max_equation="100"
+             underscore_name="so_bottleneck"
+             units="percent"
+             symbol_name="SoBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Stream Output"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="DS Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which domain shader pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="15"
+             equation="C 5 READ 100 UMUL $GpuCoreClocks FDIV"
+             max_equation="100"
+             underscore_name="ds_bottleneck"
+             units="percent"
+             symbol_name="DsBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Domain Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Clipper Bottleneck"
+             low_watermark="10"
+             description="The percentage of time in which clipper pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="30"
+             equation="C 3 READ 100 UMUL $GpuCoreClocks FDIV"
+             max_equation="100"
+             underscore_name="cl_bottleneck"
+             units="percent"
+             symbol_name="ClBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Clipper"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Stall"
+             description="The percentage of time in which domain shader pipeline stage was stalled."
+             data_type="float"
+             max_equation="100"
+             equation="C 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ds_stall"
+             units="percent"
+             symbol_name="DsStall"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO"
+             mdapi_usage_flags="Tier4 Correlate Draw"
+             mdapi_group="3D Pipe/Domain Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ A 31 READ UADD A 32 READ UADD 64 UMUL"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL OCL IO"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL OCL IO"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SO Stall"
+             description="The percentage of time in which stream-output pipeline stage was stalled."
+             data_type="float"
+             max_equation="100"
+             equation="B 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="so_stall"
+             units="percent"
+             symbol_name="SoStall"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO"
+             mdapi_usage_flags="Tier4 Correlate Draw"
+             mdapi_group="3D Pipe/Stream Output"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00000D04" value="0x00000200" />
+        <register type="NOA" address="0x00009840" value="0x00000000" />
+        <register type="NOA" address="0x00009884" value="0x00000000" />
+        <register type="NOA" address="0x00009888" value="0x00123E00" />
+        <register type="NOA" address="0x00009888" value="0x060B00B3" />
+        <register type="NOA" address="0x00009888" value="0x140B3C00" />
+        <register type="NOA" address="0x00009888" value="0x1C0B0000" />
+        <register type="NOA" address="0x00009888" value="0x120C8320" />
+        <register type="NOA" address="0x00009888" value="0x040DBE00" />
+        <register type="NOA" address="0x00009888" value="0x000D0000" />
+        <register type="NOA" address="0x00009888" value="0x280D0000" />
+        <register type="NOA" address="0x00009888" value="0x2C0E7C00" />
+        <register type="NOA" address="0x00009888" value="0x10087C00" />
+        <register type="NOA" address="0x00009888" value="0x1E120002" />
+        <register type="NOA" address="0x00009888" value="0x20120000" />
+        <register type="NOA" address="0x00009888" value="0x1E130002" />
+        <register type="NOA" address="0x00009888" value="0x0E0B0031" />
+        <register type="NOA" address="0x00009888" value="0x180B0092" />
+        <register type="NOA" address="0x00009888" value="0x1A0B00B1" />
+        <register type="NOA" address="0x00009888" value="0x020B0093" />
+        <register type="NOA" address="0x00009888" value="0x040B0033" />
+        <register type="NOA" address="0x00009888" value="0x000B0000" />
+        <register type="NOA" address="0x00009888" value="0x0A0C0022" />
+        <register type="NOA" address="0x00009888" value="0x1E0C0030" />
+        <register type="NOA" address="0x00009888" value="0x1C0C8000" />
+        <register type="NOA" address="0x00009888" value="0x140C8000" />
+        <register type="NOA" address="0x00009888" value="0x160C8000" />
+        <register type="NOA" address="0x00009888" value="0x100DC017" />
+        <register type="NOA" address="0x00009888" value="0x160D0013" />
+        <register type="NOA" address="0x00009888" value="0x1C0D0081" />
+        <register type="NOA" address="0x00009888" value="0x080D0082" />
+        <register type="NOA" address="0x00009888" value="0x0A0D8102" />
+        <register type="NOA" address="0x00009888" value="0x140D0000" />
+        <register type="NOA" address="0x00009888" value="0x0C0D0000" />
+        <register type="NOA" address="0x00009888" value="0x0E0D4000" />
+        <register type="NOA" address="0x00009888" value="0x120D0000" />
+        <register type="NOA" address="0x00009888" value="0x060DC000" />
+        <register type="NOA" address="0x00009888" value="0x0C0EC1C5" />
+        <register type="NOA" address="0x00009888" value="0x180E0000" />
+        <register type="NOA" address="0x00009888" value="0x0E0E8000" />
+        <register type="NOA" address="0x00009888" value="0x100E4000" />
+        <register type="NOA" address="0x00009888" value="0x120EC000" />
+        <register type="NOA" address="0x00009888" value="0x140EC000" />
+        <register type="NOA" address="0x00009888" value="0x160E4000" />
+        <register type="NOA" address="0x00009888" value="0x080E8000" />
+        <register type="NOA" address="0x00009888" value="0x0A0EC000" />
+        <register type="NOA" address="0x00009888" value="0x1C0F5555" />
+        <register type="NOA" address="0x00009888" value="0x1E0F0554" />
+        <register type="NOA" address="0x00009888" value="0x0E104000" />
+        <register type="NOA" address="0x00009888" value="0x10104000" />
+        <register type="NOA" address="0x00009888" value="0x14104000" />
+        <register type="NOA" address="0x00009888" value="0x16104000" />
+        <register type="NOA" address="0x00009888" value="0x18104000" />
+        <register type="NOA" address="0x00009888" value="0x1A104000" />
+        <register type="NOA" address="0x00009888" value="0x1C104000" />
+        <register type="NOA" address="0x00009888" value="0x02104000" />
+        <register type="NOA" address="0x00009888" value="0x04104000" />
+        <register type="NOA" address="0x00009888" value="0x06104000" />
+        <register type="NOA" address="0x00009888" value="0x08104000" />
+        <register type="NOA" address="0x00009888" value="0x0A104000" />
+        <register type="NOA" address="0x00009888" value="0x0C104000" />
+        <register type="NOA" address="0x00009888" value="0x0E024000" />
+        <register type="NOA" address="0x00009888" value="0x10024000" />
+        <register type="NOA" address="0x00009888" value="0x2C024000" />
+        <register type="NOA" address="0x00009888" value="0x2E020055" />
+        <register type="NOA" address="0x00009888" value="0x02024000" />
+        <register type="NOA" address="0x00009888" value="0x04024000" />
+        <register type="NOA" address="0x00009888" value="0x06024000" />
+        <register type="NOA" address="0x00009888" value="0x08024000" />
+        <register type="NOA" address="0x00009888" value="0x0A024000" />
+        <register type="NOA" address="0x00009888" value="0x0C024000" />
+        <register type="NOA" address="0x00009888" value="0x1A032000" />
+        <register type="NOA" address="0x00009888" value="0x1C032000" />
+        <register type="NOA" address="0x00009888" value="0x2A035500" />
+        <register type="NOA" address="0x00009888" value="0x2C030001" />
+        <register type="NOA" address="0x00009888" value="0x02034000" />
+        <register type="NOA" address="0x00009888" value="0x04034000" />
+        <register type="NOA" address="0x00009888" value="0x06034000" />
+        <register type="NOA" address="0x00009888" value="0x08034000" />
+        <register type="NOA" address="0x00009888" value="0x0A034000" />
+        <register type="NOA" address="0x00009888" value="0x18032000" />
+        <register type="NOA" address="0x00009888" value="0x360036DB" />
+        <register type="NOA" address="0x00009888" value="0x380026DB" />
+        <register type="NOA" address="0x00009888" value="0x1A006000" />
+        <register type="NOA" address="0x00009888" value="0x1C006000" />
+        <register type="NOA" address="0x00009888" value="0x1E006000" />
+        <register type="NOA" address="0x00009888" value="0x34001B00" />
+        <register type="NOA" address="0x00009888" value="0x26050002" />
+        <register type="NOA" address="0x00009888" value="0x0E0A8000" />
+        <register type="NOA" address="0x00009888" value="0x100A8000" />
+        <register type="NOA" address="0x00009888" value="0x120A4000" />
+        <register type="NOA" address="0x00009888" value="0x140A8000" />
+        <register type="NOA" address="0x00009888" value="0x160A8000" />
+        <register type="NOA" address="0x00009888" value="0x180A8000" />
+        <register type="NOA" address="0x00009888" value="0x1A0A8000" />
+        <register type="NOA" address="0x00009888" value="0x1C0A8000" />
+        <register type="NOA" address="0x00009888" value="0x020A8000" />
+        <register type="NOA" address="0x00009888" value="0x040A8000" />
+        <register type="NOA" address="0x00009888" value="0x060A8000" />
+        <register type="NOA" address="0x00009888" value="0x080A8000" />
+        <register type="NOA" address="0x00009888" value="0x0A0A8000" />
+        <register type="NOA" address="0x00009888" value="0x0C0A8000" />
+        <register type="NOA" address="0x00009888" value="0x08081000" />
+        <register type="NOA" address="0x00009884" value="0x00000003" />
+        <register type="NOA" address="0x00009888" value="0x5B105555" />
+        <register type="NOA" address="0x00009888" value="0x5D101555" />
+        <register type="NOA" address="0x00009888" value="0x1B14FC00" />
+        <register type="NOA" address="0x00009888" value="0x1D14003F" />
+        <register type="NOA" address="0x00009888" value="0x13148000" />
+        <register type="NOA" address="0x00009888" value="0x15148000" />
+        <register type="NOA" address="0x00009888" value="0x17148000" />
+        <register type="NOA" address="0x00009888" value="0x5F115555" />
+        <register type="NOA" address="0x00009888" value="0x61111555" />
+        <register type="NOA" address="0x00009888" value="0x0F128000" />
+        <register type="NOA" address="0x00009888" value="0x11128000" />
+        <register type="NOA" address="0x00009888" value="0x13128000" />
+        <register type="NOA" address="0x00009888" value="0x15128000" />
+        <register type="NOA" address="0x00009888" value="0x17128000" />
+        <register type="NOA" address="0x00009888" value="0x19128000" />
+        <register type="NOA" address="0x00009888" value="0x1B128000" />
+        <register type="NOA" address="0x00009888" value="0x1D128000" />
+        <register type="NOA" address="0x00009888" value="0x1F128000" />
+        <register type="NOA" address="0x00009888" value="0x03128000" />
+        <register type="NOA" address="0x00009888" value="0x05128000" />
+        <register type="NOA" address="0x00009888" value="0x07128000" />
+        <register type="NOA" address="0x00009888" value="0x09128000" />
+        <register type="NOA" address="0x00009888" value="0x0B128000" />
+        <register type="NOA" address="0x00009888" value="0x0D128000" />
+        <register type="NOA" address="0x00009888" value="0x4D100604" />
+        <register type="NOA" address="0x00009888" value="0x4F103400" />
+        <register type="NOA" address="0x00009888" value="0x51100200" />
+        <register type="NOA" address="0x00009888" value="0x53100004" />
+        <register type="NOA" address="0x00009888" value="0x55101400" />
+        <register type="NOA" address="0x00009888" value="0x17100000" />
+        <register type="NOA" address="0x00009888" value="0x31100000" />
+        <register type="NOA" address="0x00009888" value="0x57100005" />
+        <register type="NOA" address="0x00009888" value="0x47100000" />
+        <register type="NOA" address="0x00009888" value="0x49100000" />
+        <register type="NOA" address="0x00009888" value="0x4B100400" />
+        <register type="NOA" address="0x00009884" value="0x00000003" />
+        <register type="NOA" address="0x00009888" value="0x65100002" />
+        <register type="NOA" address="0x00009884" value="0x00000000" />
+        <register type="NOA" address="0x00009888" value="0x42000001" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x0000D920" value="0x00000000" />
+        <register type="OA" address="0x0000D900" value="0x00000000" />
+        <register type="OA" address="0x0000D904" value="0x00800000" />
+        <register type="OA" address="0x0000D910" value="0x00000000" />
+        <register type="OA" address="0x0000D914" value="0x00800000" />
+        <register type="OA" address="0x0000DC40" value="0x00000000" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+    </register_config>
+  </set>
+
+  <set name="Metric set HDCAndSF"
+       mdapi_supported_apis="VK OGL OCL IO"
+       underscore_name="hdc_and_sf"
+       hw_config_guid="dedd95cd-1bd4-4e65-be7f-1fd7aa43fe12"
+       chipset="TGL"
+       symbol_name="HDCAndSF"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS EM Pipe Active"
+             description="The percentage of time in which EU EM pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_em_active"
+             units="percent"
+             symbol_name="VsEmActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="Polygon Data Ready"
+             description="The percentage of time in which geometry pipeline output is ready"
+             data_type="float"
+             max_equation="100"
+             equation="B 6 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="poly_data_ready"
+             units="percent"
+             symbol_name="PolyDataReady"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/3D Pipe/Strip-Fans"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Slice0 Dualsubslice4 Non-sampler Shader Access Stalled On L3"
+             description="Percentage of time when HDC has messages to L3, but it's stalled due to lack of credits (Slice0 Dualsubslice4)"
+             data_type="float"
+             max_equation="100"
+             equation="B 1 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="non_sampler_shader04_access_stalled_on_l3"
+             units="percent"
+             symbol_name="NonSamplerShader04AccessStalledOnL3"
+             availability="$DualSubsliceMask 16 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="GPU/Data Port"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="PS EM Pipe Active"
+             description="The percentage of time in which EU EM pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_em_active"
+             units="percent"
+             symbol_name="PsEmActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="PS FPU Pipe Active"
+             description="The percentage of time in which EU FPU pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu_active"
+             units="percent"
+             symbol_name="PsFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU Pipe Active"
+             description="The percentage of time in which EU FPU pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu_active"
+             units="percent"
+             symbol_name="VsFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="Slice0 Dualsubslice1 Non-sampler Shader Access Stalled On L3"
+             description="Percentage of time when HDC has messages to L3, but it's stalled due to lack of credits (Slice0 Dualsubslice1)"
+             data_type="float"
+             max_equation="100"
+             equation="B 3 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="non_sampler_shader01_access_stalled_on_l3"
+             units="percent"
+             symbol_name="NonSamplerShader01AccessStalledOnL3"
+             availability="$DualSubsliceMask 2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="GPU/Data Port"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO MEDIA"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="Slice0 Dualsubslice2 Non-sampler Shader Access Stalled On L3"
+             description="Percentage of time when HDC has messages to L3, but it's stalled due to lack of credits (Slice0 Dualsubslice2)"
+             data_type="float"
+             max_equation="100"
+             equation="B 4 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="non_sampler_shader02_access_stalled_on_l3"
+             units="percent"
+             symbol_name="NonSamplerShader02AccessStalledOnL3"
+             availability="$DualSubsliceMask 4 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="GPU/Data Port"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL OCL IO"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="EU FPU And EM Pipes Active"
+             description="The percentage of time in which EU FPU and EM pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_em_active"
+             units="percent"
+             symbol_name="EuFpuEmActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ A 31 READ UADD A 32 READ UADD 64 UMUL"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL OCL IO"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="Slice0 Dualsubslice0 Non-sampler Shader Access Stalled On L3"
+             description="Percentage of time when HDC has messages to L3, but it's stalled due to lack of credits (Slice0 Dualsubslice0)"
+             data_type="float"
+             max_equation="100"
+             equation="B 2 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="non_sampler_shader00_access_stalled_on_l3"
+             units="percent"
+             symbol_name="NonSamplerShader00AccessStalledOnL3"
+             availability="$DualSubsliceMask 1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="GPU/Data Port"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL OCL IO"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 Dualsubslice3 Non-sampler Shader Access Stalled On L3"
+             description="Percentage of time when HDC has messages to L3, but it's stalled due to lack of credits (Slice0 Dualsubslice3)"
+             data_type="float"
+             max_equation="100"
+             equation="B 5 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="non_sampler_shader03_access_stalled_on_l3"
+             units="percent"
+             symbol_name="NonSamplerShader03AccessStalledOnL3"
+             availability="$DualSubsliceMask 8 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="GPU/Data Port"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Slice0 Dualsubslice5 Non-sampler Shader Access Stalled On L3"
+             description="Percentage of time when HDC has messages to L3, but it's stalled due to lack of credits (Slice0 Dualsubslice5)"
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="non_sampler_shader05_access_stalled_on_l3"
+             units="percent"
+             symbol_name="NonSamplerShader05AccessStalledOnL3"
+             availability="$DualSubsliceMask 32 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="GPU/Data Port"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00000D04" value="0x00000200" />
+        <register type="NOA" address="0x00009840" value="0x00000000" />
+        <register type="NOA" address="0x00009884" value="0x00000000" />
+        <register type="NOA" address="0x00009888" value="0x14112400" />
+        <register type="NOA" address="0x00009888" value="0x14312400" />
+        <register type="NOA" address="0x00009888" value="0x14512474" />
+        <register type="NOA" address="0x00009888" value="0x14712400" />
+        <register type="NOA" address="0x00009888" value="0x14912400" />
+        <register type="NOA" address="0x00009888" value="0x14B12400" />
+        <register type="NOA" address="0x00009888" value="0x240A0019" />
+        <register type="NOA" address="0x00009888" value="0x1C07C000" />
+        <register type="NOA" address="0x00009888" value="0x24070002" />
+        <register type="NOA" address="0x00009888" value="0x10110074" />
+        <register type="NOA" address="0x00009888" value="0x08110000" />
+        <register type="NOA" address="0x00009888" value="0x10128000" />
+        <register type="NOA" address="0x00009888" value="0x1C130400" />
+        <register type="NOA" address="0x00009888" value="0x12310074" />
+        <register type="NOA" address="0x00009888" value="0x10310000" />
+        <register type="NOA" address="0x00009888" value="0x08310000" />
+        <register type="NOA" address="0x00009888" value="0x12328000" />
+        <register type="NOA" address="0x00009888" value="0x1C330800" />
+        <register type="NOA" address="0x00009888" value="0x10510000" />
+        <register type="NOA" address="0x00009888" value="0x0A510000" />
+        <register type="NOA" address="0x00009888" value="0x14528000" />
+        <register type="NOA" address="0x00009888" value="0x1C531000" />
+        <register type="NOA" address="0x00009888" value="0x16710074" />
+        <register type="NOA" address="0x00009888" value="0x10710000" />
+        <register type="NOA" address="0x00009888" value="0x0A710000" />
+        <register type="NOA" address="0x00009888" value="0x16728000" />
+        <register type="NOA" address="0x00009888" value="0x1C732000" />
+        <register type="NOA" address="0x00009888" value="0x0E910074" />
+        <register type="NOA" address="0x00009888" value="0x10910000" />
+        <register type="NOA" address="0x00009888" value="0x06910000" />
+        <register type="NOA" address="0x00009888" value="0x0E928000" />
+        <register type="NOA" address="0x00009888" value="0x1C930200" />
+        <register type="NOA" address="0x00009888" value="0x00B10074" />
+        <register type="NOA" address="0x00009888" value="0x10B10000" />
+        <register type="NOA" address="0x00009888" value="0x00B28000" />
+        <register type="NOA" address="0x00009888" value="0x10B38000" />
+        <register type="NOA" address="0x00009888" value="0x1E0F0020" />
+        <register type="NOA" address="0x00009888" value="0x16104000" />
+        <register type="NOA" address="0x00009888" value="0x2E020001" />
+        <register type="NOA" address="0x00009888" value="0x2A030600" />
+        <register type="NOA" address="0x00009888" value="0x18002000" />
+        <register type="NOA" address="0x00009888" value="0x36003488" />
+        <register type="NOA" address="0x00009888" value="0x3800001B" />
+        <register type="NOA" address="0x00009888" value="0x00014000" />
+        <register type="NOA" address="0x00009888" value="0x1A012000" />
+        <register type="NOA" address="0x00009888" value="0x24050038" />
+        <register type="NOA" address="0x00009888" value="0x24060080" />
+        <register type="NOA" address="0x00009888" value="0x180A00F7" />
+        <register type="NOA" address="0x00009888" value="0x200A0000" />
+        <register type="NOA" address="0x00009888" value="0x140A8000" />
+        <register type="NOA" address="0x00009888" value="0x160A8000" />
+        <register type="NOA" address="0x00009884" value="0x00000003" />
+        <register type="NOA" address="0x00009888" value="0x41104000" />
+        <register type="NOA" address="0x00009888" value="0x5B105000" />
+        <register type="NOA" address="0x00009888" value="0x5D100055" />
+        <register type="NOA" address="0x00009888" value="0x11148000" />
+        <register type="NOA" address="0x00009888" value="0x1B14E000" />
+        <register type="NOA" address="0x00009888" value="0x1D140007" />
+        <register type="NOA" address="0x00009888" value="0x4B112000" />
+        <register type="NOA" address="0x00009888" value="0x5F115000" />
+        <register type="NOA" address="0x00009888" value="0x61110055" />
+        <register type="NOA" address="0x00009888" value="0x01128000" />
+        <register type="NOA" address="0x00009888" value="0x0F128000" />
+        <register type="NOA" address="0x00009888" value="0x11128000" />
+        <register type="NOA" address="0x00009888" value="0x13128000" />
+        <register type="NOA" address="0x00009888" value="0x15128000" />
+        <register type="NOA" address="0x00009888" value="0x17128000" />
+        <register type="NOA" address="0x00009888" value="0x19128000" />
+        <register type="NOA" address="0x00009888" value="0x47100600" />
+        <register type="NOA" address="0x00009888" value="0x4D100000" />
+        <register type="NOA" address="0x00009888" value="0x4F101116" />
+        <register type="NOA" address="0x00009888" value="0x51100401" />
+        <register type="NOA" address="0x00009888" value="0x53100030" />
+        <register type="NOA" address="0x00009888" value="0x17100000" />
+        <register type="NOA" address="0x00009888" value="0x31100000" />
+        <register type="NOA" address="0x00009884" value="0x00000003" />
+        <register type="NOA" address="0x00009888" value="0x65100002" />
+        <register type="NOA" address="0x00009884" value="0x00000000" />
+        <register type="NOA" address="0x00009888" value="0x42000001" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x0000D920" value="0x00000000" />
+        <register type="OA" address="0x0000D900" value="0x00000000" />
+        <register type="OA" address="0x0000D904" value="0xF0800000" />
+        <register type="OA" address="0x0000D910" value="0x00000000" />
+        <register type="OA" address="0x0000D914" value="0x70800000" />
+        <register type="OA" address="0x0000DC40" value="0x007F0000" />
+        <register type="OA" address="0x0000D940" value="0x00000002" />
+        <register type="OA" address="0x0000D944" value="0x0000FFFE" />
+        <register type="OA" address="0x0000DC00" value="0x00000002" />
+        <register type="OA" address="0x0000DC04" value="0x0000FFFE" />
+        <register type="OA" address="0x0000D948" value="0x00000002" />
+        <register type="OA" address="0x0000D94C" value="0x0000FFFD" />
+        <register type="OA" address="0x0000DC08" value="0x00000002" />
+        <register type="OA" address="0x0000DC0C" value="0x0000FFFD" />
+        <register type="OA" address="0x0000D950" value="0x00000002" />
+        <register type="OA" address="0x0000D954" value="0x0000FFFB" />
+        <register type="OA" address="0x0000DC10" value="0x00000002" />
+        <register type="OA" address="0x0000DC14" value="0x0000FFFB" />
+        <register type="OA" address="0x0000D958" value="0x00000002" />
+        <register type="OA" address="0x0000D95C" value="0x0000FFF7" />
+        <register type="OA" address="0x0000DC18" value="0x00000002" />
+        <register type="OA" address="0x0000DC1C" value="0x0000FFF7" />
+        <register type="OA" address="0x0000D960" value="0x00000002" />
+        <register type="OA" address="0x0000D964" value="0x0000FFEF" />
+        <register type="OA" address="0x0000DC20" value="0x00000002" />
+        <register type="OA" address="0x0000DC24" value="0x0000FFEF" />
+        <register type="OA" address="0x0000D968" value="0x00000002" />
+        <register type="OA" address="0x0000D96C" value="0x0000FFDF" />
+        <register type="OA" address="0x0000DC28" value="0x00000002" />
+        <register type="OA" address="0x0000DC2C" value="0x0000FFDF" />
+        <register type="OA" address="0x0000D970" value="0x00000002" />
+        <register type="OA" address="0x0000D974" value="0x0000FFBF" />
+        <register type="OA" address="0x0000DC30" value="0x00000002" />
+        <register type="OA" address="0x0000DC34" value="0x0000FFBF" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+    </register_config>
+  </set>
+
+  <set name="Metric set RasterizerAndPixelBackend"
+       mdapi_supported_apis="VK OGL OCL IO"
+       underscore_name="rasterizer_and_pixel_backend"
+       hw_config_guid="a889ccb3-5ebd-437f-b5c6-e951fba822f5"
+       chipset="TGL"
+       symbol_name="RasterizerAndPixelBackend"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 Pipe0 PS Output Available"
+             description="The percentage of time in which slice0 pipe0 PS output is available"
+             data_type="float"
+             max_equation="100"
+             equation="C 2 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_output00_available"
+             units="percent"
+             symbol_name="PSOutput00Available"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/3D Pipe"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="VS EM Pipe Active"
+             description="The percentage of time in which EU EM pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_em_active"
+             units="percent"
+             symbol_name="VsEmActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Slice0 Pipe1 PS Output Available"
+             description="The percentage of time in which slice0 pipe1 PS output is available"
+             data_type="float"
+             max_equation="100"
+             equation="C 1 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_output01_available"
+             units="percent"
+             symbol_name="PSOutput01Available"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/3D Pipe"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on the both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Slice0 Pipe1 Pixel Values Ready"
+             description="The percentage of time in which slice0 pipe1 pixel values are ready"
+             data_type="float"
+             max_equation="100"
+             equation="B 6 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="pixel_values01_ready"
+             units="percent"
+             symbol_name="PixelValues01Ready"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/3D Pipe"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="PS EM Pipe Active"
+             description="The percentage of time in which EU EM pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_em_active"
+             units="percent"
+             symbol_name="PsEmActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="PS FPU Pipe Active"
+             description="The percentage of time in which EU FPU pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu_active"
+             units="percent"
+             symbol_name="PsFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU Pipe Active"
+             description="The percentage of time in which EU FPU pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu_active"
+             units="percent"
+             symbol_name="VsFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="Slice0 Pipe0 Post-EarlyZ Pixel Data Ready"
+             description="The percentage of time in which slice0  pipe0 post-EarlyZ pixel data is ready (after early Z tests have been applied)"
+             data_type="float"
+             max_equation="100"
+             equation="B 1 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="pixel_data00_ready"
+             units="percent"
+             symbol_name="PixelData00Ready"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Rasterizer/Early Depth Test"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO MEDIA"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="Slice0 Rasterizer Input Available"
+             description="The percentage of time in which slice0 rasterizer input is available"
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="rasterizer0_input_available"
+             units="percent"
+             symbol_name="Rasterizer0InputAvailable"
+             availability="$SliceMask 1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Rasterizer"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL OCL IO"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="VK OGL IO"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SQ01 is full"
+             description="The percentage of time when IDI0 SQ1 is filled above a threshold (usually 48 entries)"
+             data_type="float"
+             max_equation="100"
+             equation="C 5 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gt_request_queue01_full"
+             units="percent"
+             symbol_name="GTRequestQueue01Full"
+             semantic_type="duration"
+             mdapi_supported_apis="IO"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="Slice0 Pipe2 Pixel Values Ready"
+             description="The percentage of time in which slice0 pipe2 pixel values are ready"
+             data_type="float"
+             max_equation="100"
+             equation="B 5 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="pixel_values02_ready"
+             units="percent"
+             symbol_name="PixelValues02Ready"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/3D Pipe"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="EU FPU And EM Pipes Active"
+             description="The percentage of time in which EU FPU and EM pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_em_active"
+             units="percent"
+             symbol_name="EuFpuEmActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 Pipe0 Pixel Values Ready"
+             description="The percentage of time in which slice0 pipe0 pixel values are ready"
+             data_type="float"
+             max_equation="100"
+             equation="B 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="pixel_values00_ready"
+             units="percent"
+             symbol_name="PixelValues00Ready"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/3D Pipe"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="SQ10 is full"
+             description="The percentage of time when IDI1 SQ0 is filled above a threshold (usually 48 entries)"
+             data_type="float"
+             max_equation="100"
+             equation="C 6 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gt_request_queue10_full"
+             units="percent"
+             symbol_name="GTRequestQueue10Full"
+             semantic_type="duration"
+             mdapi_supported_apis="IO"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="SQ00 is full"
+             description="The percentage of time when IDI0 SQ0 is filled above a threshold (usually 48 entries)"
+             data_type="float"
+             max_equation="100"
+             equation="C 4 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gt_request_queue00_full"
+             units="percent"
+             symbol_name="GTRequestQueue00Full"
+             semantic_type="duration"
+             mdapi_supported_apis="IO"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 Pipe2 PS Output Available"
+             description="The percentage of time in which slice0 pipe2 PS output is available"
+             data_type="float"
+             max_equation="100"
+             equation="C 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_output02_available"
+             units="percent"
+             symbol_name="PSOutput02Available"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/3D Pipe"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Slice0 Rasterizer Output Ready"
+             description="The percentage of time in which slice0 rasterizer output is ready"
+             data_type="float"
+             max_equation="100"
+             equation="C 3 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="rasterizer0_output_ready"
+             units="percent"
+             symbol_name="Rasterizer0OutputReady"
+             availability="$SliceMask 1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Rasterizer"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="SQ11 is full"
+             description="The percentage of time when IDI1 SQ1 is filled above a threshold (usually 48 entries)"
+             data_type="float"
+             max_equation="100"
+             equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gt_request_queue11_full"
+             units="percent"
+             symbol_name="GTRequestQueue11Full"
+             semantic_type="duration"
+             mdapi_supported_apis="IO"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ A 31 READ UADD A 32 READ UADD 64 UMUL"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL OCL IO"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="VK OGL OCL IO"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00000D04" value="0x00000200" />
+        <register type="NOA" address="0x00009840" value="0x00000000" />
+        <register type="NOA" address="0x00009884" value="0x00000000" />
+        <register type="NOA" address="0x00009888" value="0x1E075000" />
+        <register type="NOA" address="0x00009888" value="0x1A0700C0" />
+        <register type="NOA" address="0x00009888" value="0x1E055000" />
+        <register type="NOA" address="0x00009888" value="0x1A0500C0" />
+        <register type="NOA" address="0x00009888" value="0x1E065000" />
+        <register type="NOA" address="0x00009888" value="0x1A0600C0" />
+        <register type="NOA" address="0x00009888" value="0x2A0A7300" />
+        <register type="NOA" address="0x00009888" value="0x2C0A0000" />
+        <register type="NOA" address="0x00009888" value="0x120800A0" />
+        <register type="NOA" address="0x00009888" value="0x0A07C000" />
+        <register type="NOA" address="0x00009888" value="0x0E070027" />
+        <register type="NOA" address="0x00009888" value="0x10070000" />
+        <register type="NOA" address="0x00009888" value="0x24070000" />
+        <register type="NOA" address="0x00009888" value="0x2A032000" />
+        <register type="NOA" address="0x00009888" value="0x2C030008" />
+        <register type="NOA" address="0x00009888" value="0x18006000" />
+        <register type="NOA" address="0x00009888" value="0x360036D8" />
+        <register type="NOA" address="0x00009888" value="0x38003299" />
+        <register type="NOA" address="0x00009888" value="0x1A004000" />
+        <register type="NOA" address="0x00009888" value="0x1C006000" />
+        <register type="NOA" address="0x00009888" value="0x2A010400" />
+        <register type="NOA" address="0x00009888" value="0x2C010001" />
+        <register type="NOA" address="0x00009888" value="0x0C05C000" />
+        <register type="NOA" address="0x00009888" value="0x00052700" />
+        <register type="NOA" address="0x00009888" value="0x10050000" />
+        <register type="NOA" address="0x00009888" value="0x24050000" />
+        <register type="NOA" address="0x00009888" value="0x22050000" />
+        <register type="NOA" address="0x00009888" value="0x0C0600C0" />
+        <register type="NOA" address="0x00009888" value="0x0E062700" />
+        <register type="NOA" address="0x00009888" value="0x10060000" />
+        <register type="NOA" address="0x00009888" value="0x24060000" />
+        <register type="NOA" address="0x00009888" value="0x26060000" />
+        <register type="NOA" address="0x00009888" value="0x000A0144" />
+        <register type="NOA" address="0x00009888" value="0x0E0A0145" />
+        <register type="NOA" address="0x00009888" value="0x100A0156" />
+        <register type="NOA" address="0x00009888" value="0x040A014F" />
+        <register type="NOA" address="0x00009888" value="0x200A0000" />
+        <register type="NOA" address="0x00009888" value="0x120A4000" />
+        <register type="NOA" address="0x00009888" value="0x140A4000" />
+        <register type="NOA" address="0x00009888" value="0x180A8000" />
+        <register type="NOA" address="0x00009888" value="0x1E0A8000" />
+        <register type="NOA" address="0x00009888" value="0x08081980" />
+        <register type="NOA" address="0x00009888" value="0x0A080032" />
+        <register type="NOA" address="0x00009888" value="0x10080000" />
+        <register type="NOA" address="0x00009884" value="0x00000003" />
+        <register type="NOA" address="0x00009888" value="0x31152800" />
+        <register type="NOA" address="0x00009888" value="0x331500A0" />
+        <register type="NOA" address="0x00009888" value="0x31352800" />
+        <register type="NOA" address="0x00009888" value="0x333500A0" />
+        <register type="NOA" address="0x00009888" value="0x41104000" />
+        <register type="NOA" address="0x00009888" value="0x5B105FA5" />
+        <register type="NOA" address="0x00009888" value="0x5D101555" />
+        <register type="NOA" address="0x00009888" value="0x11148000" />
+        <register type="NOA" address="0x00009888" value="0x1B14E000" />
+        <register type="NOA" address="0x00009888" value="0x1D14003F" />
+        <register type="NOA" address="0x00009888" value="0x13148000" />
+        <register type="NOA" address="0x00009888" value="0x15148000" />
+        <register type="NOA" address="0x00009888" value="0x4B112000" />
+        <register type="NOA" address="0x00009888" value="0x5F115005" />
+        <register type="NOA" address="0x00009888" value="0x61111555" />
+        <register type="NOA" address="0x00009888" value="0x01128000" />
+        <register type="NOA" address="0x00009888" value="0x0F128000" />
+        <register type="NOA" address="0x00009888" value="0x11128000" />
+        <register type="NOA" address="0x00009888" value="0x13128000" />
+        <register type="NOA" address="0x00009888" value="0x15128000" />
+        <register type="NOA" address="0x00009888" value="0x17128000" />
+        <register type="NOA" address="0x00009888" value="0x19128000" />
+        <register type="NOA" address="0x00009888" value="0x1B128000" />
+        <register type="NOA" address="0x00009888" value="0x1D128000" />
+        <register type="NOA" address="0x00009888" value="0x1F128000" />
+        <register type="NOA" address="0x00009888" value="0x03128000" />
+        <register type="NOA" address="0x00009888" value="0x05128000" />
+        <register type="NOA" address="0x00009888" value="0x07150016" />
+        <register type="NOA" address="0x00009888" value="0x09150096" />
+        <register type="NOA" address="0x00009888" value="0x01150000" />
+        <register type="NOA" address="0x00009888" value="0x03168000" />
+        <register type="NOA" address="0x00009888" value="0x05164000" />
+        <register type="NOA" address="0x00009888" value="0x0B350016" />
+        <register type="NOA" address="0x00009888" value="0x0D350096" />
+        <register type="NOA" address="0x00009888" value="0x01350000" />
+        <register type="NOA" address="0x00009888" value="0x05368000" />
+        <register type="NOA" address="0x00009888" value="0x07364000" />
+        <register type="NOA" address="0x00009888" value="0x47100400" />
+        <register type="NOA" address="0x00009888" value="0x4D100616" />
+        <register type="NOA" address="0x00009888" value="0x4F100404" />
+        <register type="NOA" address="0x00009888" value="0x51100202" />
+        <register type="NOA" address="0x00009888" value="0x53100002" />
+        <register type="NOA" address="0x00009888" value="0x55100204" />
+        <register type="NOA" address="0x00009888" value="0x17100000" />
+        <register type="NOA" address="0x00009888" value="0x31100000" />
+        <register type="NOA" address="0x00009888" value="0x57100000" />
+        <register type="NOA" address="0x00009888" value="0x49101404" />
+        <register type="NOA" address="0x00009888" value="0x4B101616" />
+        <register type="NOA" address="0x00009884" value="0x00000003" />
+        <register type="NOA" address="0x00009888" value="0x65100002" />
+        <register type="NOA" address="0x00009884" value="0x00000000" />
+        <register type="NOA" address="0x00009888" value="0x42000001" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x0000D920" value="0x00000000" />
+        <register type="OA" address="0x0000D900" value="0x00000000" />
+        <register type="OA" address="0x0000D904" value="0x30800000" />
+        <register type="OA" address="0x0000D910" value="0x00000000" />
+        <register type="OA" address="0x0000D914" value="0x00800000" />
+        <register type="OA" address="0x0000DC40" value="0x00030000" />
+        <register type="OA" address="0x0000D940" value="0x00000038" />
+        <register type="OA" address="0x0000D944" value="0x0000FFF8" />
+        <register type="OA" address="0x0000DC00" value="0x00000038" />
+        <register type="OA" address="0x0000DC04" value="0x0000FFF8" />
+        <register type="OA" address="0x0000D948" value="0x000000C0" />
+        <register type="OA" address="0x0000D94C" value="0x0000FFE7" />
+        <register type="OA" address="0x0000DC08" value="0x000000C0" />
+        <register type="OA" address="0x0000DC0C" value="0x0000FFE7" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+    </register_config>
+  </set>
+
+  <set name="Gen12LP L3_1"
+       mdapi_supported_apis="VK OGL OCL MEDIA IO"
+       underscore_name="l3_1"
+       hw_config_guid="feee2629-03a8-4d31-ab4d-7d16572163fb"
+       chipset="TGL"
+       symbol_name="L3_1"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 L3 Bank5 Input Available"
+             description="The percentage of time in which slice0 L3 bank5 has input available"
+             data_type="float"
+             max_equation="100"
+             equation="B 7 READ B 6 READ FADD B 5 READ FADD B 4 READ FADD 4 FDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l30_bank5_input_available"
+             units="percent"
+             symbol_name="L30Bank5InputAvailable"
+             availability="$SliceMask 1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="EU FPU And EM Pipes Active"
+             description="The percentage of time in which EU FPU and EM pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_em_active"
+             units="percent"
+             symbol_name="EuFpuEmActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 L3 Bank0 Input Available"
+             description="The percentage of time in which slice0 L3 bank0 has input available"
+             data_type="float"
+             max_equation="100"
+             equation="C 7 READ C 6 READ FADD C 5 READ FADD C 4 READ FADD 4 FDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l30_bank0_input_available"
+             units="percent"
+             symbol_name="L30Bank0InputAvailable"
+             availability="$SliceMask 1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO MEDIA"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="EU Thread Occupancy"
+             description="The percentage of time in which hardware threads occupied EUs."
+             data_type="float"
+             max_equation="100"
+             equation="8 A 10 READ FMUL $EuThreadsCount FDIV $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_thread_occupancy"
+             units="percent"
+             symbol_name="EuThreadOccupancy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 L3 Bank1 Input Available"
+             description="The percentage of time in which slice0 L3 bank1 has input available"
+             data_type="float"
+             max_equation="100"
+             equation="C 3 READ C 2 READ FADD C 1 READ FADD C 0 READ FADD 4 FDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l30_bank1_input_available"
+             units="percent"
+             symbol_name="L30Bank1InputAvailable"
+             availability="$SliceMask 1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 L3 Bank4 Input Available"
+             description="The percentage of time in which slice0 L3 bank4 has input available"
+             data_type="float"
+             max_equation="100"
+             equation="B 3 READ B 2 READ FADD B 1 READ FADD B 0 READ FADD 4 FDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l30_bank4_input_available"
+             units="percent"
+             symbol_name="L30Bank4InputAvailable"
+             availability="$SliceMask 1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00000D04" value="0x00000200" />
+        <register type="NOA" address="0x00009840" value="0x00000000" />
+        <register type="NOA" address="0x00009884" value="0x00000000" />
+        <register type="NOA" address="0x00009888" value="0x04022000" />
+        <register type="NOA" address="0x00009888" value="0x06022800" />
+        <register type="NOA" address="0x00009888" value="0x04002827" />
+        <register type="NOA" address="0x00009888" value="0x0600202C" />
+        <register type="NOA" address="0x00009888" value="0x00020024" />
+        <register type="NOA" address="0x00009888" value="0x0E020025" />
+        <register type="NOA" address="0x00009888" value="0x10020026" />
+        <register type="NOA" address="0x00009888" value="0x12020027" />
+        <register type="NOA" address="0x00009888" value="0x1402002C" />
+        <register type="NOA" address="0x00009888" value="0x1602002D" />
+        <register type="NOA" address="0x00009888" value="0x1802002E" />
+        <register type="NOA" address="0x00009888" value="0x1A02002F" />
+        <register type="NOA" address="0x00009888" value="0x2E020000" />
+        <register type="NOA" address="0x00009888" value="0x2C020000" />
+        <register type="NOA" address="0x00009888" value="0x00034000" />
+        <register type="NOA" address="0x00009888" value="0x1A032000" />
+        <register type="NOA" address="0x00009888" value="0x1C032000" />
+        <register type="NOA" address="0x00009888" value="0x1E032000" />
+        <register type="NOA" address="0x00009888" value="0x2A035500" />
+        <register type="NOA" address="0x00009888" value="0x1C000024" />
+        <register type="NOA" address="0x00009888" value="0x1E000025" />
+        <register type="NOA" address="0x00009888" value="0x02000026" />
+        <register type="NOA" address="0x00009888" value="0x0800002D" />
+        <register type="NOA" address="0x00009888" value="0x0A00002E" />
+        <register type="NOA" address="0x00009888" value="0x0C00002F" />
+        <register type="NOA" address="0x00009888" value="0x360036D8" />
+        <register type="NOA" address="0x00009888" value="0x18006000" />
+        <register type="NOA" address="0x00009888" value="0x380000DB" />
+        <register type="NOA" address="0x00009888" value="0x1A000000" />
+        <register type="NOA" address="0x00009888" value="0x34000000" />
+        <register type="NOA" address="0x00009888" value="0x000A8000" />
+        <register type="NOA" address="0x00009888" value="0x0E0A8000" />
+        <register type="NOA" address="0x00009888" value="0x100A8000" />
+        <register type="NOA" address="0x00009888" value="0x120A8000" />
+        <register type="NOA" address="0x00009888" value="0x140A8000" />
+        <register type="NOA" address="0x00009888" value="0x160A8000" />
+        <register type="NOA" address="0x00009888" value="0x180A8000" />
+        <register type="NOA" address="0x00009888" value="0x1A0A8000" />
+        <register type="NOA" address="0x00009884" value="0x00000003" />
+        <register type="NOA" address="0x00009888" value="0x41104000" />
+        <register type="NOA" address="0x00009888" value="0x5B105555" />
+        <register type="NOA" address="0x00009888" value="0x5D101555" />
+        <register type="NOA" address="0x00009888" value="0x11148000" />
+        <register type="NOA" address="0x00009888" value="0x1B14FC00" />
+        <register type="NOA" address="0x00009888" value="0x1D14003F" />
+        <register type="NOA" address="0x00009888" value="0x13148000" />
+        <register type="NOA" address="0x00009888" value="0x15148000" />
+        <register type="NOA" address="0x00009888" value="0x17148000" />
+        <register type="NOA" address="0x00009888" value="0x4B112000" />
+        <register type="NOA" address="0x00009888" value="0x5F115555" />
+        <register type="NOA" address="0x00009888" value="0x61111555" />
+        <register type="NOA" address="0x00009888" value="0x01128000" />
+        <register type="NOA" address="0x00009888" value="0x0F128000" />
+        <register type="NOA" address="0x00009888" value="0x11128000" />
+        <register type="NOA" address="0x00009888" value="0x13128000" />
+        <register type="NOA" address="0x00009888" value="0x15128000" />
+        <register type="NOA" address="0x00009888" value="0x17128000" />
+        <register type="NOA" address="0x00009888" value="0x19128000" />
+        <register type="NOA" address="0x00009888" value="0x1B128000" />
+        <register type="NOA" address="0x00009888" value="0x1D128000" />
+        <register type="NOA" address="0x00009888" value="0x1F128000" />
+        <register type="NOA" address="0x00009888" value="0x03128000" />
+        <register type="NOA" address="0x00009888" value="0x05128000" />
+        <register type="NOA" address="0x00009888" value="0x07128000" />
+        <register type="NOA" address="0x00009888" value="0x09128000" />
+        <register type="NOA" address="0x00009888" value="0x0B128000" />
+        <register type="NOA" address="0x00009888" value="0x0D128000" />
+        <register type="NOA" address="0x00009888" value="0x47100000" />
+        <register type="NOA" address="0x00009888" value="0x4D100606" />
+        <register type="NOA" address="0x00009888" value="0x4F100000" />
+        <register type="NOA" address="0x00009888" value="0x51100000" />
+        <register type="NOA" address="0x00009888" value="0x53100000" />
+        <register type="NOA" address="0x00009888" value="0x55100600" />
+        <register type="NOA" address="0x00009888" value="0x17100000" />
+        <register type="NOA" address="0x00009888" value="0x31100000" />
+        <register type="NOA" address="0x00009888" value="0x57100006" />
+        <register type="NOA" address="0x00009888" value="0x49100606" />
+        <register type="NOA" address="0x00009888" value="0x4B100606" />
+        <register type="NOA" address="0x00009884" value="0x00000003" />
+        <register type="NOA" address="0x00009888" value="0x65100002" />
+        <register type="NOA" address="0x00009884" value="0x00000000" />
+        <register type="NOA" address="0x00009888" value="0x42000001" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x0000D920" value="0x00000000" />
+        <register type="OA" address="0x0000D900" value="0x00000000" />
+        <register type="OA" address="0x0000D904" value="0x00800000" />
+        <register type="OA" address="0x0000D910" value="0x00000000" />
+        <register type="OA" address="0x0000D914" value="0x00800000" />
+        <register type="OA" address="0x0000DC40" value="0x00000000" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00008003" />
+    </register_config>
+  </set>
+
+  <set name="Gen12LP L3_2"
+       mdapi_supported_apis="VK OGL OCL MEDIA IO"
+       underscore_name="l3_2"
+       hw_config_guid="5266f235-1711-4eef-9493-ebdf0238d512"
+       chipset="TGL"
+       symbol_name="L3_2"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 L3 Bank3 Input Available"
+             description="The percentage of time in which slice0 L3 bank3 has input available"
+             data_type="float"
+             max_equation="100"
+             equation="B 7 READ B 6 READ FADD B 5 READ FADD B 4 READ FADD 4 FDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l30_bank3_input_available"
+             units="percent"
+             symbol_name="L30Bank3InputAvailable"
+             availability="$SliceMask 1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Slice0 L3 Bank6 Input Available"
+             description="The percentage of time in which slice0 L3 bank6 has input available"
+             data_type="float"
+             max_equation="100"
+             equation="C 3 READ C 2 READ FADD C 1 READ FADD C 0 READ FADD 4 FDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l30_bank6_input_available"
+             units="percent"
+             symbol_name="L30Bank6InputAvailable"
+             availability="$SliceMask 1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Slice0 L3 Bank2 Input Available"
+             description="The percentage of time in which slice0 L3 bank2 has input available"
+             data_type="float"
+             max_equation="100"
+             equation="B 3 READ B 2 READ FADD B 1 READ FADD B 0 READ FADD 4 FDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l30_bank2_input_available"
+             units="percent"
+             symbol_name="L30Bank2InputAvailable"
+             availability="$SliceMask 1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="EU FPU And EM Pipes Active"
+             description="The percentage of time in which EU FPU and EM pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_em_active"
+             units="percent"
+             symbol_name="EuFpuEmActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO MEDIA"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="EU Thread Occupancy"
+             description="The percentage of time in which hardware threads occupied EUs."
+             data_type="float"
+             max_equation="100"
+             equation="8 A 10 READ FMUL $EuThreadsCount FDIV $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_thread_occupancy"
+             units="percent"
+             symbol_name="EuThreadOccupancy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 L3 Bank7 Input Available"
+             description="The percentage of time in which slice0 L3 bank7 has input available"
+             data_type="float"
+             max_equation="100"
+             equation="C 7 READ C 6 READ FADD C 5 READ FADD C 4 READ FADD 4 FDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l30_bank7_input_available"
+             units="percent"
+             symbol_name="L30Bank7InputAvailable"
+             availability="$SliceMask 1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00000D04" value="0x00000200" />
+        <register type="NOA" address="0x00009840" value="0x00000000" />
+        <register type="NOA" address="0x00009884" value="0x00000000" />
+        <register type="NOA" address="0x00009888" value="0x04023027" />
+        <register type="NOA" address="0x00009888" value="0x0602382C" />
+        <register type="NOA" address="0x00009888" value="0x04003000" />
+        <register type="NOA" address="0x00009888" value="0x06003800" />
+        <register type="NOA" address="0x00009888" value="0x1C020024" />
+        <register type="NOA" address="0x00009888" value="0x1E020025" />
+        <register type="NOA" address="0x00009888" value="0x02020026" />
+        <register type="NOA" address="0x00009888" value="0x0802002D" />
+        <register type="NOA" address="0x00009888" value="0x0A02002E" />
+        <register type="NOA" address="0x00009888" value="0x0C02002F" />
+        <register type="NOA" address="0x00009888" value="0x2E020000" />
+        <register type="NOA" address="0x00009888" value="0x2C030005" />
+        <register type="NOA" address="0x00009888" value="0x02034000" />
+        <register type="NOA" address="0x00009888" value="0x04034000" />
+        <register type="NOA" address="0x00009888" value="0x06034000" />
+        <register type="NOA" address="0x00009888" value="0x08034000" />
+        <register type="NOA" address="0x00009888" value="0x0A034000" />
+        <register type="NOA" address="0x00009888" value="0x18032000" />
+        <register type="NOA" address="0x00009888" value="0x00000024" />
+        <register type="NOA" address="0x00009888" value="0x0E000025" />
+        <register type="NOA" address="0x00009888" value="0x10000026" />
+        <register type="NOA" address="0x00009888" value="0x12000027" />
+        <register type="NOA" address="0x00009888" value="0x1400002C" />
+        <register type="NOA" address="0x00009888" value="0x1600002D" />
+        <register type="NOA" address="0x00009888" value="0x1800002E" />
+        <register type="NOA" address="0x00009888" value="0x1A00602F" />
+        <register type="NOA" address="0x00009888" value="0x36000003" />
+        <register type="NOA" address="0x00009888" value="0x38003600" />
+        <register type="NOA" address="0x00009888" value="0x1C006000" />
+        <register type="NOA" address="0x00009888" value="0x1E006000" />
+        <register type="NOA" address="0x00009888" value="0x34001B00" />
+        <register type="NOA" address="0x00009888" value="0x1C0A8000" />
+        <register type="NOA" address="0x00009888" value="0x1E0A8000" />
+        <register type="NOA" address="0x00009888" value="0x020A8000" />
+        <register type="NOA" address="0x00009888" value="0x040A8000" />
+        <register type="NOA" address="0x00009888" value="0x060A8000" />
+        <register type="NOA" address="0x00009888" value="0x080A8000" />
+        <register type="NOA" address="0x00009888" value="0x0A0A8000" />
+        <register type="NOA" address="0x00009888" value="0x0C0A8000" />
+        <register type="NOA" address="0x00009884" value="0x00000003" />
+        <register type="NOA" address="0x00009888" value="0x41104000" />
+        <register type="NOA" address="0x00009888" value="0x5B105555" />
+        <register type="NOA" address="0x00009888" value="0x5D101555" />
+        <register type="NOA" address="0x00009888" value="0x11148000" />
+        <register type="NOA" address="0x00009888" value="0x1B14FC00" />
+        <register type="NOA" address="0x00009888" value="0x1D14003F" />
+        <register type="NOA" address="0x00009888" value="0x13148000" />
+        <register type="NOA" address="0x00009888" value="0x15148000" />
+        <register type="NOA" address="0x00009888" value="0x17148000" />
+        <register type="NOA" address="0x00009888" value="0x4B112000" />
+        <register type="NOA" address="0x00009888" value="0x5F115555" />
+        <register type="NOA" address="0x00009888" value="0x61111555" />
+        <register type="NOA" address="0x00009888" value="0x01128000" />
+        <register type="NOA" address="0x00009888" value="0x0F128000" />
+        <register type="NOA" address="0x00009888" value="0x11128000" />
+        <register type="NOA" address="0x00009888" value="0x13128000" />
+        <register type="NOA" address="0x00009888" value="0x15128000" />
+        <register type="NOA" address="0x00009888" value="0x17128000" />
+        <register type="NOA" address="0x00009888" value="0x19128000" />
+        <register type="NOA" address="0x00009888" value="0x1B128000" />
+        <register type="NOA" address="0x00009888" value="0x1D128000" />
+        <register type="NOA" address="0x00009888" value="0x1F128000" />
+        <register type="NOA" address="0x00009888" value="0x03128000" />
+        <register type="NOA" address="0x00009888" value="0x05128000" />
+        <register type="NOA" address="0x00009888" value="0x07128000" />
+        <register type="NOA" address="0x00009888" value="0x09128000" />
+        <register type="NOA" address="0x00009888" value="0x0B128000" />
+        <register type="NOA" address="0x00009888" value="0x0D128000" />
+        <register type="NOA" address="0x00009888" value="0x47100600" />
+        <register type="NOA" address="0x00009888" value="0x4D100000" />
+        <register type="NOA" address="0x00009888" value="0x4F100606" />
+        <register type="NOA" address="0x00009888" value="0x51100606" />
+        <register type="NOA" address="0x00009888" value="0x53100606" />
+        <register type="NOA" address="0x00009888" value="0x55100006" />
+        <register type="NOA" address="0x00009888" value="0x17100000" />
+        <register type="NOA" address="0x00009888" value="0x31100000" />
+        <register type="NOA" address="0x00009888" value="0x57100000" />
+        <register type="NOA" address="0x00009888" value="0x49100000" />
+        <register type="NOA" address="0x00009888" value="0x4B100000" />
+        <register type="NOA" address="0x00009884" value="0x00000003" />
+        <register type="NOA" address="0x00009888" value="0x65100002" />
+        <register type="NOA" address="0x00009884" value="0x00000000" />
+        <register type="NOA" address="0x00009888" value="0x42000001" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x0000D920" value="0x00000000" />
+        <register type="OA" address="0x0000D900" value="0x00000000" />
+        <register type="OA" address="0x0000D904" value="0x00800000" />
+        <register type="OA" address="0x0000D910" value="0x00000000" />
+        <register type="OA" address="0x0000D914" value="0x00800000" />
+        <register type="OA" address="0x0000DC40" value="0x00000000" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00008003" />
+    </register_config>
+  </set>
+
+  <set name="Gen12LP L3_3"
+       mdapi_supported_apis="VK OGL OCL MEDIA IO"
+       underscore_name="l3_3"
+       hw_config_guid="9c2cd379-bf93-4ded-b481-f64efd534c4a"
+       chipset="TGL"
+       symbol_name="L3_3"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 L3 Bank4 Output Ready"
+             description="The percentage of time in which slice0 L3 bank4 output is ready"
+             data_type="float"
+             max_equation="100"
+             equation="C 5 READ C 4 READ FADD 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l30_bank4_output_ready"
+             units="percent"
+             symbol_name="L30Bank4OutputReady"
+             availability="$SliceMask 1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Slice0 L3 Bank0 Output Ready"
+             description="The percentage of time in which slice0 L3 bank0 output is ready"
+             data_type="float"
+             max_equation="100"
+             equation="C 7 READ C 6 READ FADD 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l30_bank0_output_ready"
+             units="percent"
+             symbol_name="L30Bank0OutputReady"
+             availability="$SliceMask 1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="EU FPU And EM Pipes Active"
+             description="The percentage of time in which EU FPU and EM pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_em_active"
+             units="percent"
+             symbol_name="EuFpuEmActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO MEDIA"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="EU Thread Occupancy"
+             description="The percentage of time in which hardware threads occupied EUs."
+             data_type="float"
+             max_equation="100"
+             equation="8 A 10 READ FMUL $EuThreadsCount FDIV $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_thread_occupancy"
+             units="percent"
+             symbol_name="EuThreadOccupancy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00000D04" value="0x00000200" />
+        <register type="NOA" address="0x00009840" value="0x00000000" />
+        <register type="NOA" address="0x00009884" value="0x00000000" />
+        <register type="NOA" address="0x00009888" value="0x04020200" />
+        <register type="NOA" address="0x00009888" value="0x06020020" />
+        <register type="NOA" address="0x00009888" value="0x04000200" />
+        <register type="NOA" address="0x00009888" value="0x06000000" />
+        <register type="NOA" address="0x00009888" value="0x08020028" />
+        <register type="NOA" address="0x00009888" value="0x2E020000" />
+        <register type="NOA" address="0x00009888" value="0x06034000" />
+        <register type="NOA" address="0x00009888" value="0x08034000" />
+        <register type="NOA" address="0x00009888" value="0x0A000020" />
+        <register type="NOA" address="0x00009888" value="0x0C000028" />
+        <register type="NOA" address="0x00009888" value="0x36000000" />
+        <register type="NOA" address="0x00009888" value="0x1E006000" />
+        <register type="NOA" address="0x00009888" value="0x34000300" />
+        <register type="NOA" address="0x00009888" value="0x060A8000" />
+        <register type="NOA" address="0x00009888" value="0x080A8000" />
+        <register type="NOA" address="0x00009884" value="0x00000003" />
+        <register type="NOA" address="0x00009888" value="0x5B100550" />
+        <register type="NOA" address="0x00009888" value="0x17148000" />
+        <register type="NOA" address="0x00009888" value="0x1B141C00" />
+        <register type="NOA" address="0x00009888" value="0x5F110550" />
+        <register type="NOA" address="0x00009888" value="0x07128000" />
+        <register type="NOA" address="0x00009888" value="0x09128000" />
+        <register type="NOA" address="0x00009888" value="0x0B128000" />
+        <register type="NOA" address="0x00009888" value="0x0D128000" />
+        <register type="NOA" address="0x00009888" value="0x17100000" />
+        <register type="NOA" address="0x00009888" value="0x49100000" />
+        <register type="NOA" address="0x00009888" value="0x4B100000" />
+        <register type="NOA" address="0x00009888" value="0x4D100606" />
+        <register type="NOA" address="0x00009888" value="0x31100000" />
+        <register type="NOA" address="0x00009884" value="0x00000003" />
+        <register type="NOA" address="0x00009888" value="0x65100002" />
+        <register type="NOA" address="0x00009884" value="0x00000000" />
+        <register type="NOA" address="0x00009888" value="0x42000001" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x0000D920" value="0x00000000" />
+        <register type="OA" address="0x0000D900" value="0x00000000" />
+        <register type="OA" address="0x0000D904" value="0x00800000" />
+        <register type="OA" address="0x0000D910" value="0x00000000" />
+        <register type="OA" address="0x0000D914" value="0x00800000" />
+        <register type="OA" address="0x0000DC40" value="0x00000000" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00008003" />
+    </register_config>
+  </set>
+
+  <set name="Gen12LP L3_4"
+       mdapi_supported_apis="VK OGL OCL MEDIA IO"
+       underscore_name="l3_4"
+       hw_config_guid="6a68185d-0056-4891-a5f6-29aa1e1d81ae"
+       chipset="TGL"
+       symbol_name="L3_4"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 L3 Bank1 Output Ready"
+             description="The percentage of time in which slice0 L3 bank1 output is ready"
+             data_type="float"
+             max_equation="100"
+             equation="C 5 READ C 4 READ FADD 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l30_bank1_output_ready"
+             units="percent"
+             symbol_name="L30Bank1OutputReady"
+             availability="$SliceMask 1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="EU FPU And EM Pipes Active"
+             description="The percentage of time in which EU FPU and EM pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_em_active"
+             units="percent"
+             symbol_name="EuFpuEmActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO MEDIA"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="EU Thread Occupancy"
+             description="The percentage of time in which hardware threads occupied EUs."
+             data_type="float"
+             max_equation="100"
+             equation="8 A 10 READ FMUL $EuThreadsCount FDIV $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_thread_occupancy"
+             units="percent"
+             symbol_name="EuThreadOccupancy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 L3 Bank5 Output Ready"
+             description="The percentage of time in which slice0 L3 bank5 output is ready"
+             data_type="float"
+             max_equation="100"
+             equation="C 7 READ C 6 READ FADD 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l30_bank5_output_ready"
+             units="percent"
+             symbol_name="L30Bank5OutputReady"
+             availability="$SliceMask 1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00000D04" value="0x00000200" />
+        <register type="NOA" address="0x00009840" value="0x00000000" />
+        <register type="NOA" address="0x00009884" value="0x00000000" />
+        <register type="NOA" address="0x00009888" value="0x04020A00" />
+        <register type="NOA" address="0x00009888" value="0x06020800" />
+        <register type="NOA" address="0x00009888" value="0x04000A00" />
+        <register type="NOA" address="0x00009888" value="0x06000820" />
+        <register type="NOA" address="0x00009888" value="0x0A020020" />
+        <register type="NOA" address="0x00009888" value="0x0C020028" />
+        <register type="NOA" address="0x00009888" value="0x2E020000" />
+        <register type="NOA" address="0x00009888" value="0x0A034000" />
+        <register type="NOA" address="0x00009888" value="0x18032000" />
+        <register type="NOA" address="0x00009888" value="0x08000028" />
+        <register type="NOA" address="0x00009888" value="0x36000003" />
+        <register type="NOA" address="0x00009888" value="0x1E000000" />
+        <register type="NOA" address="0x00009888" value="0x34001800" />
+        <register type="NOA" address="0x00009888" value="0x0A0A8000" />
+        <register type="NOA" address="0x00009888" value="0x0C0A8000" />
+        <register type="NOA" address="0x00009884" value="0x00000003" />
+        <register type="NOA" address="0x00009888" value="0x5B100550" />
+        <register type="NOA" address="0x00009888" value="0x17148000" />
+        <register type="NOA" address="0x00009888" value="0x1B141C00" />
+        <register type="NOA" address="0x00009888" value="0x5F110550" />
+        <register type="NOA" address="0x00009888" value="0x07128000" />
+        <register type="NOA" address="0x00009888" value="0x09128000" />
+        <register type="NOA" address="0x00009888" value="0x0B128000" />
+        <register type="NOA" address="0x00009888" value="0x0D128000" />
+        <register type="NOA" address="0x00009888" value="0x17100000" />
+        <register type="NOA" address="0x00009888" value="0x49100000" />
+        <register type="NOA" address="0x00009888" value="0x4B100606" />
+        <register type="NOA" address="0x00009888" value="0x4D100000" />
+        <register type="NOA" address="0x00009888" value="0x31100000" />
+        <register type="NOA" address="0x00009884" value="0x00000003" />
+        <register type="NOA" address="0x00009888" value="0x65100002" />
+        <register type="NOA" address="0x00009884" value="0x00000000" />
+        <register type="NOA" address="0x00009888" value="0x42000001" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x0000D920" value="0x00000000" />
+        <register type="OA" address="0x0000D900" value="0x00000000" />
+        <register type="OA" address="0x0000D904" value="0x00800000" />
+        <register type="OA" address="0x0000D910" value="0x00000000" />
+        <register type="OA" address="0x0000D914" value="0x00800000" />
+        <register type="OA" address="0x0000DC40" value="0x00000000" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00008003" />
+    </register_config>
+  </set>
+
+  <set name="Gen12LP L3_5"
+       mdapi_supported_apis="VK OGL OCL MEDIA IO"
+       underscore_name="l3_5"
+       hw_config_guid="3f17a326-ae8b-4869-9f5a-3bccf793e287"
+       chipset="TGL"
+       symbol_name="L3_5"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 L3 Bank6 Output Ready"
+             description="The percentage of time in which slice0 L3 bank6 output is ready"
+             data_type="float"
+             max_equation="100"
+             equation="C 7 READ C 6 READ FADD 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l30_bank6_output_ready"
+             units="percent"
+             symbol_name="L30Bank6OutputReady"
+             availability="$SliceMask 1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="EU FPU And EM Pipes Active"
+             description="The percentage of time in which EU FPU and EM pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_em_active"
+             units="percent"
+             symbol_name="EuFpuEmActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO MEDIA"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="EU Thread Occupancy"
+             description="The percentage of time in which hardware threads occupied EUs."
+             data_type="float"
+             max_equation="100"
+             equation="8 A 10 READ FMUL $EuThreadsCount FDIV $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_thread_occupancy"
+             units="percent"
+             symbol_name="EuThreadOccupancy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 L3 Bank2 Output Ready"
+             description="The percentage of time in which slice0 L3 bank2 output is ready"
+             data_type="float"
+             max_equation="100"
+             equation="C 5 READ C 4 READ FADD 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l30_bank2_output_ready"
+             units="percent"
+             symbol_name="L30Bank2OutputReady"
+             availability="$SliceMask 1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00000D04" value="0x00000200" />
+        <register type="NOA" address="0x00009840" value="0x00000000" />
+        <register type="NOA" address="0x00009884" value="0x00000000" />
+        <register type="NOA" address="0x00009888" value="0x04021200" />
+        <register type="NOA" address="0x00009888" value="0x06021000" />
+        <register type="NOA" address="0x00009888" value="0x04001200" />
+        <register type="NOA" address="0x00009888" value="0x06001020" />
+        <register type="NOA" address="0x00009888" value="0x0A020020" />
+        <register type="NOA" address="0x00009888" value="0x0C020028" />
+        <register type="NOA" address="0x00009888" value="0x2E020000" />
+        <register type="NOA" address="0x00009888" value="0x0A034000" />
+        <register type="NOA" address="0x00009888" value="0x18032000" />
+        <register type="NOA" address="0x00009888" value="0x08000028" />
+        <register type="NOA" address="0x00009888" value="0x36000003" />
+        <register type="NOA" address="0x00009888" value="0x1E000000" />
+        <register type="NOA" address="0x00009888" value="0x34001800" />
+        <register type="NOA" address="0x00009888" value="0x0A0A8000" />
+        <register type="NOA" address="0x00009888" value="0x0C0A8000" />
+        <register type="NOA" address="0x00009884" value="0x00000003" />
+        <register type="NOA" address="0x00009888" value="0x5B100550" />
+        <register type="NOA" address="0x00009888" value="0x17148000" />
+        <register type="NOA" address="0x00009888" value="0x1B141C00" />
+        <register type="NOA" address="0x00009888" value="0x5F110550" />
+        <register type="NOA" address="0x00009888" value="0x07128000" />
+        <register type="NOA" address="0x00009888" value="0x09128000" />
+        <register type="NOA" address="0x00009888" value="0x0B128000" />
+        <register type="NOA" address="0x00009888" value="0x0D128000" />
+        <register type="NOA" address="0x00009888" value="0x17100000" />
+        <register type="NOA" address="0x00009888" value="0x49100000" />
+        <register type="NOA" address="0x00009888" value="0x4B100606" />
+        <register type="NOA" address="0x00009888" value="0x4D100000" />
+        <register type="NOA" address="0x00009888" value="0x31100000" />
+        <register type="NOA" address="0x00009884" value="0x00000003" />
+        <register type="NOA" address="0x00009888" value="0x65100002" />
+        <register type="NOA" address="0x00009884" value="0x00000000" />
+        <register type="NOA" address="0x00009888" value="0x42000001" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x0000D920" value="0x00000000" />
+        <register type="OA" address="0x0000D900" value="0x00000000" />
+        <register type="OA" address="0x0000D904" value="0x00800000" />
+        <register type="OA" address="0x0000D910" value="0x00000000" />
+        <register type="OA" address="0x0000D914" value="0x00800000" />
+        <register type="OA" address="0x0000DC40" value="0x00000000" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00008003" />
+    </register_config>
+  </set>
+
+  <set name="Gen12LP L3_6"
+       mdapi_supported_apis="VK OGL OCL MEDIA IO"
+       underscore_name="l3_6"
+       hw_config_guid="d312c40a-9fb7-489a-9a1a-9cd80aac6d61"
+       chipset="TGL"
+       symbol_name="L3_6"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 L3 Bank7 Output Ready"
+             description="The percentage of time in which slice0 L3 bank7 output is ready"
+             data_type="float"
+             max_equation="100"
+             equation="C 7 READ C 6 READ FADD 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l30_bank7_output_ready"
+             units="percent"
+             symbol_name="L30Bank7OutputReady"
+             availability="$SliceMask 1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="EU FPU And EM Pipes Active"
+             description="The percentage of time in which EU FPU and EM pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_em_active"
+             units="percent"
+             symbol_name="EuFpuEmActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO MEDIA"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="EU Thread Occupancy"
+             description="The percentage of time in which hardware threads occupied EUs."
+             data_type="float"
+             max_equation="100"
+             equation="8 A 10 READ FMUL $EuThreadsCount FDIV $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_thread_occupancy"
+             units="percent"
+             symbol_name="EuThreadOccupancy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 L3 Bank3 Output Ready"
+             description="The percentage of time in which slice0 L3 bank3 output is ready"
+             data_type="float"
+             max_equation="100"
+             equation="C 5 READ C 4 READ FADD 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l30_bank3_output_ready"
+             units="percent"
+             symbol_name="L30Bank3OutputReady"
+             availability="$SliceMask 1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00000D04" value="0x00000200" />
+        <register type="NOA" address="0x00009840" value="0x00000000" />
+        <register type="NOA" address="0x00009884" value="0x00000000" />
+        <register type="NOA" address="0x00009888" value="0x04021A00" />
+        <register type="NOA" address="0x00009888" value="0x06021800" />
+        <register type="NOA" address="0x00009888" value="0x04001A00" />
+        <register type="NOA" address="0x00009888" value="0x06001820" />
+        <register type="NOA" address="0x00009888" value="0x0A020020" />
+        <register type="NOA" address="0x00009888" value="0x0C020028" />
+        <register type="NOA" address="0x00009888" value="0x2E020000" />
+        <register type="NOA" address="0x00009888" value="0x0A034000" />
+        <register type="NOA" address="0x00009888" value="0x18032000" />
+        <register type="NOA" address="0x00009888" value="0x08000028" />
+        <register type="NOA" address="0x00009888" value="0x36000003" />
+        <register type="NOA" address="0x00009888" value="0x1E000000" />
+        <register type="NOA" address="0x00009888" value="0x34001800" />
+        <register type="NOA" address="0x00009888" value="0x0A0A8000" />
+        <register type="NOA" address="0x00009888" value="0x0C0A8000" />
+        <register type="NOA" address="0x00009884" value="0x00000003" />
+        <register type="NOA" address="0x00009888" value="0x5B100550" />
+        <register type="NOA" address="0x00009888" value="0x17148000" />
+        <register type="NOA" address="0x00009888" value="0x1B141C00" />
+        <register type="NOA" address="0x00009888" value="0x5F110550" />
+        <register type="NOA" address="0x00009888" value="0x07128000" />
+        <register type="NOA" address="0x00009888" value="0x09128000" />
+        <register type="NOA" address="0x00009888" value="0x0B128000" />
+        <register type="NOA" address="0x00009888" value="0x0D128000" />
+        <register type="NOA" address="0x00009888" value="0x17100000" />
+        <register type="NOA" address="0x00009888" value="0x49100000" />
+        <register type="NOA" address="0x00009888" value="0x4B100606" />
+        <register type="NOA" address="0x00009888" value="0x4D100000" />
+        <register type="NOA" address="0x00009888" value="0x31100000" />
+        <register type="NOA" address="0x00009884" value="0x00000003" />
+        <register type="NOA" address="0x00009888" value="0x65100002" />
+        <register type="NOA" address="0x00009884" value="0x00000000" />
+        <register type="NOA" address="0x00009888" value="0x42000001" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x0000D920" value="0x00000000" />
+        <register type="OA" address="0x0000D900" value="0x00000000" />
+        <register type="OA" address="0x0000D904" value="0x00800000" />
+        <register type="OA" address="0x0000D910" value="0x00000000" />
+        <register type="OA" address="0x0000D914" value="0x00800000" />
+        <register type="OA" address="0x0000DC40" value="0x00000000" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00008003" />
+    </register_config>
+  </set>
+
+  <set name="Sampler_1"
+       mdapi_supported_apis="VK OGL OCL MEDIA IO"
+       underscore_name="sampler_1"
+       hw_config_guid="f0f255a4-535c-43ed-9d6b-85958cef6c1c"
+       chipset="TGL"
+       symbol_name="Sampler_1"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 DualSubslice1 Input Available"
+             description="The percentage of time in which slice0 dualsubslice1 sampler input is available"
+             data_type="float"
+             max_equation="100"
+             equation="B 4 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler01_input_available"
+             units="percent"
+             symbol_name="Sampler01InputAvailable"
+             availability="$DualSubsliceMask 2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="dualsubslice"
+             />
+    <counter name="Slice0 DualSubslice2 Input Available"
+             description="The percentage of time in which slice0 dualsubslice2 sampler input is available"
+             data_type="float"
+             max_equation="100"
+             equation="B 3 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler02_input_available"
+             units="percent"
+             symbol_name="Sampler02InputAvailable"
+             availability="$DualSubsliceMask 4 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="dualsubslice"
+             />
+    <counter name="EU FPU And EM Pipes Active"
+             description="The percentage of time in which EU FPU and EM pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_em_active"
+             units="percent"
+             symbol_name="EuFpuEmActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 DualSubslice3 Input Available"
+             description="The percentage of time in which slice0 dualsubslice3 sampler input is available"
+             data_type="float"
+             max_equation="100"
+             equation="B 2 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler03_input_available"
+             units="percent"
+             symbol_name="Sampler03InputAvailable"
+             availability="$DualSubsliceMask 8 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="dualsubslice"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO MEDIA"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="EU Thread Occupancy"
+             description="The percentage of time in which hardware threads occupied EUs."
+             data_type="float"
+             max_equation="100"
+             equation="8 A 10 READ FMUL $EuThreadsCount FDIV $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_thread_occupancy"
+             units="percent"
+             symbol_name="EuThreadOccupancy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 DualSubslice4 Input Available"
+             description="The percentage of time in which slice0 dualsubslice4 sampler input is available"
+             data_type="float"
+             max_equation="100"
+             equation="B 1 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler04_input_available"
+             units="percent"
+             symbol_name="Sampler04InputAvailable"
+             availability="$DualSubsliceMask 16 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="dualsubslice"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Slice0 DualSubslice5 Input Available"
+             description="The percentage of time in which slice0 dualsubslice5 sampler input is available"
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler05_input_available"
+             units="percent"
+             symbol_name="Sampler05InputAvailable"
+             availability="$DualSubsliceMask 32 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="dualsubslice"
+             />
+    <counter name="Slice0 DualSubslice0 Input Available"
+             description="The percentage of time in which slice0 dualsubslice0 sampler input is available"
+             data_type="float"
+             max_equation="100"
+             equation="B 5 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler00_input_available"
+             units="percent"
+             symbol_name="Sampler00InputAvailable"
+             availability="$DualSubsliceMask 1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="dualsubslice"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00000D04" value="0x00000200" />
+        <register type="NOA" address="0x00009840" value="0x00000000" />
+        <register type="NOA" address="0x00009884" value="0x00000000" />
+        <register type="NOA" address="0x00009888" value="0x1C121600" />
+        <register type="NOA" address="0x00009888" value="0x18141600" />
+        <register type="NOA" address="0x00009888" value="0x1C325600" />
+        <register type="NOA" address="0x00009888" value="0x18341600" />
+        <register type="NOA" address="0x00009888" value="0x1C521600" />
+        <register type="NOA" address="0x00009888" value="0x185416A6" />
+        <register type="NOA" address="0x00009888" value="0x1C721600" />
+        <register type="NOA" address="0x00009888" value="0x18741600" />
+        <register type="NOA" address="0x00009888" value="0x1C921600" />
+        <register type="NOA" address="0x00009888" value="0x18941600" />
+        <register type="NOA" address="0x00009888" value="0x1CB21600" />
+        <register type="NOA" address="0x00009888" value="0x18B41600" />
+        <register type="NOA" address="0x00009888" value="0x1C07C000" />
+        <register type="NOA" address="0x00009888" value="0x2407002B" />
+        <register type="NOA" address="0x00009888" value="0x04120086" />
+        <register type="NOA" address="0x00009888" value="0x20120000" />
+        <register type="NOA" address="0x00009888" value="0x02124000" />
+        <register type="NOA" address="0x00009888" value="0x12138000" />
+        <register type="NOA" address="0x00009888" value="0x14138000" />
+        <register type="NOA" address="0x00009888" value="0x021400A6" />
+        <register type="NOA" address="0x00009888" value="0x10140000" />
+        <register type="NOA" address="0x00009888" value="0x00140000" />
+        <register type="NOA" address="0x00009888" value="0x1A150020" />
+        <register type="NOA" address="0x00009888" value="0x1E320086" />
+        <register type="NOA" address="0x00009888" value="0x20320000" />
+        <register type="NOA" address="0x00009888" value="0x1E330003" />
+        <register type="NOA" address="0x00009888" value="0x1C3400A6" />
+        <register type="NOA" address="0x00009888" value="0x10340000" />
+        <register type="NOA" address="0x00009888" value="0x0E340000" />
+        <register type="NOA" address="0x00009888" value="0x1C358000" />
+        <register type="NOA" address="0x00009888" value="0x1A520086" />
+        <register type="NOA" address="0x00009888" value="0x20520000" />
+        <register type="NOA" address="0x00009888" value="0x18524000" />
+        <register type="NOA" address="0x00009888" value="0x1C53C000" />
+        <register type="NOA" address="0x00009888" value="0x10540000" />
+        <register type="NOA" address="0x00009888" value="0x0C540000" />
+        <register type="NOA" address="0x00009888" value="0x1C550800" />
+        <register type="NOA" address="0x00009888" value="0x16720086" />
+        <register type="NOA" address="0x00009888" value="0x20720000" />
+        <register type="NOA" address="0x00009888" value="0x14724000" />
+        <register type="NOA" address="0x00009888" value="0x1C733000" />
+        <register type="NOA" address="0x00009888" value="0x147400A6" />
+        <register type="NOA" address="0x00009888" value="0x10740000" />
+        <register type="NOA" address="0x00009888" value="0x0A740000" />
+        <register type="NOA" address="0x00009888" value="0x1C750080" />
+        <register type="NOA" address="0x00009888" value="0x12920086" />
+        <register type="NOA" address="0x00009888" value="0x20920000" />
+        <register type="NOA" address="0x00009888" value="0x10924000" />
+        <register type="NOA" address="0x00009888" value="0x1C930C00" />
+        <register type="NOA" address="0x00009888" value="0x109400A6" />
+        <register type="NOA" address="0x00009888" value="0x08940000" />
+        <register type="NOA" address="0x00009888" value="0x1C950008" />
+        <register type="NOA" address="0x00009888" value="0x0EB20086" />
+        <register type="NOA" address="0x00009888" value="0x20B20000" />
+        <register type="NOA" address="0x00009888" value="0x00B24000" />
+        <register type="NOA" address="0x00009888" value="0x10B38000" />
+        <register type="NOA" address="0x00009888" value="0x1CB30200" />
+        <register type="NOA" address="0x00009888" value="0x00B400A6" />
+        <register type="NOA" address="0x00009888" value="0x10B40000" />
+        <register type="NOA" address="0x00009888" value="0x18B58000" />
+        <register type="NOA" address="0x00009888" value="0x1E0F0028" />
+        <register type="NOA" address="0x00009888" value="0x14104000" />
+        <register type="NOA" address="0x00009888" value="0x16104000" />
+        <register type="NOA" address="0x00009888" value="0x2C024000" />
+        <register type="NOA" address="0x00009888" value="0x2E020001" />
+        <register type="NOA" address="0x00009888" value="0x2A03A500" />
+        <register type="NOA" address="0x00009888" value="0x18002000" />
+        <register type="NOA" address="0x00009888" value="0x36003248" />
+        <register type="NOA" address="0x00009888" value="0x380024DB" />
+        <register type="NOA" address="0x00009888" value="0x1A004000" />
+        <register type="NOA" address="0x00009888" value="0x1C004000" />
+        <register type="NOA" address="0x00009888" value="0x00014000" />
+        <register type="NOA" address="0x00009888" value="0x1A012000" />
+        <register type="NOA" address="0x00009888" value="0x1C012000" />
+        <register type="NOA" address="0x00009888" value="0x1E012000" />
+        <register type="NOA" address="0x00009888" value="0x2405C000" />
+        <register type="NOA" address="0x00009888" value="0x26050003" />
+        <register type="NOA" address="0x00009888" value="0x220500A0" />
+        <register type="NOA" address="0x00009888" value="0x24062800" />
+        <register type="NOA" address="0x00009888" value="0x140A8000" />
+        <register type="NOA" address="0x00009888" value="0x160A8000" />
+        <register type="NOA" address="0x00009888" value="0x180A8000" />
+        <register type="NOA" address="0x00009888" value="0x1A0A8000" />
+        <register type="NOA" address="0x00009884" value="0x00000003" />
+        <register type="NOA" address="0x00009888" value="0x41104000" />
+        <register type="NOA" address="0x00009888" value="0x5B105005" />
+        <register type="NOA" address="0x00009888" value="0x5D101555" />
+        <register type="NOA" address="0x00009888" value="0x11148000" />
+        <register type="NOA" address="0x00009888" value="0x1B14E000" />
+        <register type="NOA" address="0x00009888" value="0x1D14003F" />
+        <register type="NOA" address="0x00009888" value="0x13148000" />
+        <register type="NOA" address="0x00009888" value="0x15148000" />
+        <register type="NOA" address="0x00009888" value="0x4B112000" />
+        <register type="NOA" address="0x00009888" value="0x5F115005" />
+        <register type="NOA" address="0x00009888" value="0x61111555" />
+        <register type="NOA" address="0x00009888" value="0x01128000" />
+        <register type="NOA" address="0x00009888" value="0x0F128000" />
+        <register type="NOA" address="0x00009888" value="0x11128000" />
+        <register type="NOA" address="0x00009888" value="0x13128000" />
+        <register type="NOA" address="0x00009888" value="0x15128000" />
+        <register type="NOA" address="0x00009888" value="0x17128000" />
+        <register type="NOA" address="0x00009888" value="0x19128000" />
+        <register type="NOA" address="0x00009888" value="0x1B128000" />
+        <register type="NOA" address="0x00009888" value="0x1D128000" />
+        <register type="NOA" address="0x00009888" value="0x1F128000" />
+        <register type="NOA" address="0x00009888" value="0x03128000" />
+        <register type="NOA" address="0x00009888" value="0x05128000" />
+        <register type="NOA" address="0x00009888" value="0x47101600" />
+        <register type="NOA" address="0x00009888" value="0x4D101000" />
+        <register type="NOA" address="0x00009888" value="0x4F101603" />
+        <register type="NOA" address="0x00009888" value="0x51100003" />
+        <register type="NOA" address="0x00009888" value="0x53101404" />
+        <register type="NOA" address="0x00009888" value="0x55101111" />
+        <register type="NOA" address="0x00009888" value="0x17100000" />
+        <register type="NOA" address="0x00009888" value="0x31100000" />
+        <register type="NOA" address="0x00009888" value="0x57100005" />
+        <register type="NOA" address="0x00009888" value="0x49100511" />
+        <register type="NOA" address="0x00009884" value="0x00000003" />
+        <register type="NOA" address="0x00009888" value="0x65100002" />
+        <register type="NOA" address="0x00009884" value="0x00000000" />
+        <register type="NOA" address="0x00009888" value="0x42000001" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x0000D920" value="0x00000000" />
+        <register type="OA" address="0x0000D900" value="0x00000000" />
+        <register type="OA" address="0x0000D904" value="0xF0800000" />
+        <register type="OA" address="0x0000D910" value="0x00000000" />
+        <register type="OA" address="0x0000D914" value="0x30800000" />
+        <register type="OA" address="0x0000DC40" value="0x003F0000" />
+        <register type="OA" address="0x0000D940" value="0x00000018" />
+        <register type="OA" address="0x0000D944" value="0x0000FFFC" />
+        <register type="OA" address="0x0000DC00" value="0x00000018" />
+        <register type="OA" address="0x0000DC04" value="0x0000FFFC" />
+        <register type="OA" address="0x0000D948" value="0x00000060" />
+        <register type="OA" address="0x0000D94C" value="0x0000FFF3" />
+        <register type="OA" address="0x0000DC08" value="0x00000060" />
+        <register type="OA" address="0x0000DC0C" value="0x0000FFF3" />
+        <register type="OA" address="0x0000D950" value="0x00000180" />
+        <register type="OA" address="0x0000D954" value="0x0000FFCF" />
+        <register type="OA" address="0x0000DC10" value="0x00000180" />
+        <register type="OA" address="0x0000DC14" value="0x0000FFCF" />
+        <register type="OA" address="0x0000D958" value="0x00000600" />
+        <register type="OA" address="0x0000D95C" value="0x0000FF3F" />
+        <register type="OA" address="0x0000DC18" value="0x00000600" />
+        <register type="OA" address="0x0000DC1C" value="0x0000FF3F" />
+        <register type="OA" address="0x0000D960" value="0x00001800" />
+        <register type="OA" address="0x0000D964" value="0x0000FCFF" />
+        <register type="OA" address="0x0000DC20" value="0x00001800" />
+        <register type="OA" address="0x0000DC24" value="0x0000FCFF" />
+        <register type="OA" address="0x0000D968" value="0x00006000" />
+        <register type="OA" address="0x0000D96C" value="0x0000F3FF" />
+        <register type="OA" address="0x0000DC28" value="0x00006000" />
+        <register type="OA" address="0x0000DC2C" value="0x0000F3FF" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00008003" />
+    </register_config>
+  </set>
+
+  <set name="Sampler_2"
+       mdapi_supported_apis="VK OGL OCL MEDIA IO"
+       underscore_name="sampler_2"
+       hw_config_guid="f47c6b97-fc10-4962-bb67-d623e9d6219b"
+       chipset="TGL"
+       symbol_name="Sampler_2"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 DualSubslice0 Sampler Output Ready"
+             description="The percentage of time in which slice0 dualsubslice0 sampler output is ready"
+             data_type="float"
+             max_equation="100"
+             equation="B 5 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler00_output_ready"
+             units="percent"
+             symbol_name="Sampler00OutputReady"
+             availability="$DualSubsliceMask 1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Slice0 DualSubslice1 Sampler Output Ready"
+             description="The percentage of time in which slice0 dualsubslice1 sampler output is ready"
+             data_type="float"
+             max_equation="100"
+             equation="B 4 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler01_output_ready"
+             units="percent"
+             symbol_name="Sampler01OutputReady"
+             availability="$DualSubsliceMask 2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="EU FPU And EM Pipes Active"
+             description="The percentage of time in which EU FPU and EM pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_em_active"
+             units="percent"
+             symbol_name="EuFpuEmActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 DualSubslice2 Sampler Output Ready"
+             description="The percentage of time in which slice0 dualsubslice2 sampler output is ready"
+             data_type="float"
+             max_equation="100"
+             equation="B 3 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler02_output_ready"
+             units="percent"
+             symbol_name="Sampler02OutputReady"
+             availability="$DualSubsliceMask 4 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO MEDIA"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="EU Thread Occupancy"
+             description="The percentage of time in which hardware threads occupied EUs."
+             data_type="float"
+             max_equation="100"
+             equation="8 A 10 READ FMUL $EuThreadsCount FDIV $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_thread_occupancy"
+             units="percent"
+             symbol_name="EuThreadOccupancy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 DualSubslice3 Sampler Output Ready"
+             description="The percentage of time in which slice0 dualsubslice3 sampler output is ready"
+             data_type="float"
+             max_equation="100"
+             equation="B 2 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler03_output_ready"
+             units="percent"
+             symbol_name="Sampler03OutputReady"
+             availability="$DualSubsliceMask 8 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Slice0 DualSubslice4 Sampler Output Ready"
+             description="The percentage of time in which slice0 dualsubslice4 sampler output is ready"
+             data_type="float"
+             max_equation="100"
+             equation="B 1 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler04_output_ready"
+             units="percent"
+             symbol_name="Sampler04OutputReady"
+             availability="$DualSubsliceMask 16 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Slice0 DualSubslice5 Sampler Output Ready"
+             description="The percentage of time in which slice0 dualsubslice5 sampler output is ready"
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler05_output_ready"
+             units="percent"
+             symbol_name="Sampler05OutputReady"
+             availability="$DualSubsliceMask 32 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00000D04" value="0x00000200" />
+        <register type="NOA" address="0x00009840" value="0x00000000" />
+        <register type="NOA" address="0x00009884" value="0x00000000" />
+        <register type="NOA" address="0x00009888" value="0x0C123E00" />
+        <register type="NOA" address="0x00009888" value="0x04143E00" />
+        <register type="NOA" address="0x00009888" value="0x0C323E00" />
+        <register type="NOA" address="0x00009888" value="0x04343E00" />
+        <register type="NOA" address="0x00009888" value="0x0C523E00" />
+        <register type="NOA" address="0x00009888" value="0x04543E00" />
+        <register type="NOA" address="0x00009888" value="0x0C723E00" />
+        <register type="NOA" address="0x00009888" value="0x04743E00" />
+        <register type="NOA" address="0x00009888" value="0x0C923E00" />
+        <register type="NOA" address="0x00009888" value="0x04943E00" />
+        <register type="NOA" address="0x00009888" value="0x0CB23E00" />
+        <register type="NOA" address="0x00009888" value="0x04B43E00" />
+        <register type="NOA" address="0x00009888" value="0x1C07C000" />
+        <register type="NOA" address="0x00009888" value="0x2407002B" />
+        <register type="NOA" address="0x00009888" value="0x04120033" />
+        <register type="NOA" address="0x00009888" value="0x20120000" />
+        <register type="NOA" address="0x00009888" value="0x02124000" />
+        <register type="NOA" address="0x00009888" value="0x12138000" />
+        <register type="NOA" address="0x00009888" value="0x14138000" />
+        <register type="NOA" address="0x00009888" value="0x02140013" />
+        <register type="NOA" address="0x00009888" value="0x10140000" />
+        <register type="NOA" address="0x00009888" value="0x00140000" />
+        <register type="NOA" address="0x00009888" value="0x1A150020" />
+        <register type="NOA" address="0x00009888" value="0x1E320033" />
+        <register type="NOA" address="0x00009888" value="0x20320000" />
+        <register type="NOA" address="0x00009888" value="0x1C324000" />
+        <register type="NOA" address="0x00009888" value="0x1E330003" />
+        <register type="NOA" address="0x00009888" value="0x1C340013" />
+        <register type="NOA" address="0x00009888" value="0x10340000" />
+        <register type="NOA" address="0x00009888" value="0x0E340000" />
+        <register type="NOA" address="0x00009888" value="0x1C358000" />
+        <register type="NOA" address="0x00009888" value="0x1A520033" />
+        <register type="NOA" address="0x00009888" value="0x20520000" />
+        <register type="NOA" address="0x00009888" value="0x18524000" />
+        <register type="NOA" address="0x00009888" value="0x1C53C000" />
+        <register type="NOA" address="0x00009888" value="0x18540013" />
+        <register type="NOA" address="0x00009888" value="0x10540000" />
+        <register type="NOA" address="0x00009888" value="0x0C540000" />
+        <register type="NOA" address="0x00009888" value="0x1C550800" />
+        <register type="NOA" address="0x00009888" value="0x16720033" />
+        <register type="NOA" address="0x00009888" value="0x20720000" />
+        <register type="NOA" address="0x00009888" value="0x14724000" />
+        <register type="NOA" address="0x00009888" value="0x1C733000" />
+        <register type="NOA" address="0x00009888" value="0x14740013" />
+        <register type="NOA" address="0x00009888" value="0x10740000" />
+        <register type="NOA" address="0x00009888" value="0x0A740000" />
+        <register type="NOA" address="0x00009888" value="0x1C750080" />
+        <register type="NOA" address="0x00009888" value="0x12920033" />
+        <register type="NOA" address="0x00009888" value="0x20920000" />
+        <register type="NOA" address="0x00009888" value="0x10924000" />
+        <register type="NOA" address="0x00009888" value="0x1C930C00" />
+        <register type="NOA" address="0x00009888" value="0x10940013" />
+        <register type="NOA" address="0x00009888" value="0x08940000" />
+        <register type="NOA" address="0x00009888" value="0x1C950008" />
+        <register type="NOA" address="0x00009888" value="0x0EB20033" />
+        <register type="NOA" address="0x00009888" value="0x20B20000" />
+        <register type="NOA" address="0x00009888" value="0x00B24000" />
+        <register type="NOA" address="0x00009888" value="0x10B38000" />
+        <register type="NOA" address="0x00009888" value="0x1CB30200" />
+        <register type="NOA" address="0x00009888" value="0x00B40013" />
+        <register type="NOA" address="0x00009888" value="0x10B40000" />
+        <register type="NOA" address="0x00009888" value="0x18B58000" />
+        <register type="NOA" address="0x00009888" value="0x1E0F0028" />
+        <register type="NOA" address="0x00009888" value="0x14104000" />
+        <register type="NOA" address="0x00009888" value="0x16104000" />
+        <register type="NOA" address="0x00009888" value="0x2C024000" />
+        <register type="NOA" address="0x00009888" value="0x2E020001" />
+        <register type="NOA" address="0x00009888" value="0x2A03A500" />
+        <register type="NOA" address="0x00009888" value="0x18002000" />
+        <register type="NOA" address="0x00009888" value="0x36003248" />
+        <register type="NOA" address="0x00009888" value="0x380024DB" />
+        <register type="NOA" address="0x00009888" value="0x1A004000" />
+        <register type="NOA" address="0x00009888" value="0x1C004000" />
+        <register type="NOA" address="0x00009888" value="0x00014000" />
+        <register type="NOA" address="0x00009888" value="0x1A012000" />
+        <register type="NOA" address="0x00009888" value="0x1C012000" />
+        <register type="NOA" address="0x00009888" value="0x1E012000" />
+        <register type="NOA" address="0x00009888" value="0x2405C000" />
+        <register type="NOA" address="0x00009888" value="0x26050003" />
+        <register type="NOA" address="0x00009888" value="0x220500A0" />
+        <register type="NOA" address="0x00009888" value="0x24062800" />
+        <register type="NOA" address="0x00009888" value="0x140A8000" />
+        <register type="NOA" address="0x00009888" value="0x160A8000" />
+        <register type="NOA" address="0x00009888" value="0x180A8000" />
+        <register type="NOA" address="0x00009888" value="0x1A0A8000" />
+        <register type="NOA" address="0x00009884" value="0x00000003" />
+        <register type="NOA" address="0x00009888" value="0x41104000" />
+        <register type="NOA" address="0x00009888" value="0x5B105005" />
+        <register type="NOA" address="0x00009888" value="0x5D101555" />
+        <register type="NOA" address="0x00009888" value="0x11148000" />
+        <register type="NOA" address="0x00009888" value="0x1B14E000" />
+        <register type="NOA" address="0x00009888" value="0x1D14003F" />
+        <register type="NOA" address="0x00009888" value="0x13148000" />
+        <register type="NOA" address="0x00009888" value="0x15148000" />
+        <register type="NOA" address="0x00009888" value="0x4B112000" />
+        <register type="NOA" address="0x00009888" value="0x5F115005" />
+        <register type="NOA" address="0x00009888" value="0x61111555" />
+        <register type="NOA" address="0x00009888" value="0x01128000" />
+        <register type="NOA" address="0x00009888" value="0x0F128000" />
+        <register type="NOA" address="0x00009888" value="0x11128000" />
+        <register type="NOA" address="0x00009888" value="0x13128000" />
+        <register type="NOA" address="0x00009888" value="0x15128000" />
+        <register type="NOA" address="0x00009888" value="0x17128000" />
+        <register type="NOA" address="0x00009888" value="0x19128000" />
+        <register type="NOA" address="0x00009888" value="0x1B128000" />
+        <register type="NOA" address="0x00009888" value="0x1D128000" />
+        <register type="NOA" address="0x00009888" value="0x1F128000" />
+        <register type="NOA" address="0x00009888" value="0x03128000" />
+        <register type="NOA" address="0x00009888" value="0x05128000" />
+        <register type="NOA" address="0x00009888" value="0x47101600" />
+        <register type="NOA" address="0x00009888" value="0x4D101000" />
+        <register type="NOA" address="0x00009888" value="0x4F101603" />
+        <register type="NOA" address="0x00009888" value="0x51100003" />
+        <register type="NOA" address="0x00009888" value="0x53101404" />
+        <register type="NOA" address="0x00009888" value="0x55101111" />
+        <register type="NOA" address="0x00009888" value="0x17100000" />
+        <register type="NOA" address="0x00009888" value="0x31100000" />
+        <register type="NOA" address="0x00009888" value="0x57100005" />
+        <register type="NOA" address="0x00009888" value="0x49100511" />
+        <register type="NOA" address="0x00009884" value="0x00000003" />
+        <register type="NOA" address="0x00009888" value="0x65100002" />
+        <register type="NOA" address="0x00009884" value="0x00000000" />
+        <register type="NOA" address="0x00009888" value="0x42000001" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x0000D920" value="0x00000000" />
+        <register type="OA" address="0x0000D900" value="0x00000000" />
+        <register type="OA" address="0x0000D904" value="0xF0800000" />
+        <register type="OA" address="0x0000D910" value="0x00000000" />
+        <register type="OA" address="0x0000D914" value="0x30800000" />
+        <register type="OA" address="0x0000DC40" value="0x003F0000" />
+        <register type="OA" address="0x0000D940" value="0x00000018" />
+        <register type="OA" address="0x0000D944" value="0x0000FFFC" />
+        <register type="OA" address="0x0000DC00" value="0x00000018" />
+        <register type="OA" address="0x0000DC04" value="0x0000FFFC" />
+        <register type="OA" address="0x0000D948" value="0x00000060" />
+        <register type="OA" address="0x0000D94C" value="0x0000FFF3" />
+        <register type="OA" address="0x0000DC08" value="0x00000060" />
+        <register type="OA" address="0x0000DC0C" value="0x0000FFF3" />
+        <register type="OA" address="0x0000D950" value="0x00000180" />
+        <register type="OA" address="0x0000D954" value="0x0000FFCF" />
+        <register type="OA" address="0x0000DC10" value="0x00000180" />
+        <register type="OA" address="0x0000DC14" value="0x0000FFCF" />
+        <register type="OA" address="0x0000D958" value="0x00000600" />
+        <register type="OA" address="0x0000D95C" value="0x0000FF3F" />
+        <register type="OA" address="0x0000DC18" value="0x00000600" />
+        <register type="OA" address="0x0000DC1C" value="0x0000FF3F" />
+        <register type="OA" address="0x0000D960" value="0x00001800" />
+        <register type="OA" address="0x0000D964" value="0x0000FCFF" />
+        <register type="OA" address="0x0000DC20" value="0x00001800" />
+        <register type="OA" address="0x0000DC24" value="0x0000FCFF" />
+        <register type="OA" address="0x0000D968" value="0x00006000" />
+        <register type="OA" address="0x0000D96C" value="0x0000F3FF" />
+        <register type="OA" address="0x0000DC28" value="0x00006000" />
+        <register type="OA" address="0x0000DC2C" value="0x0000F3FF" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00008003" />
+    </register_config>
+  </set>
+
+  <set name="TDL_1"
+       mdapi_supported_apis="VK OGL OCL MEDIA IO"
+       underscore_name="tdl_1"
+       hw_config_guid="2e49d25e-93e8-4e2b-b91b-51731f5fb315"
+       chipset="TGL"
+       symbol_name="TDL_1"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Thread Header Ready on Slice0 DualSubslice1 Thread Dispatcher"
+             description="The percentage of time in which thread header is ready on slice0 dualsubslice1 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="B 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header01_ready"
+             units="percent"
+             symbol_name="ThreadHeader01Ready"
+             availability="$DualSubsliceMask 2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="dualsubslice"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Non-PS Thread Ready For Dispatch on Slice0 DualSubslice2 Thread Dispatcher"
+             description="The percentage of time in which non-PS thread is ready for dispatch on slice0 dualsubslice2 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="B 3 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="non_ps_thread02_ready_for_dispatch"
+             units="percent"
+             symbol_name="NonPSThread02ReadyForDispatch"
+             availability="$DualSubsliceMask 4 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="dualsubslice"
+             />
+    <counter name="Thread Header Ready on Slice0 DualSubslice1 Thread Dispatcher Port 2"
+             description="The percentage of time in which thread header is ready on slice0 dualsubslice1 thread dispatcher port 2"
+             data_type="float"
+             max_equation="100"
+             equation="C 6 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header01_ready_port2"
+             units="percent"
+             symbol_name="ThreadHeader01ReadyPort2"
+             availability="$DualSubsliceMask 2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="dualsubslice"
+             />
+    <counter name="Thread Header Ready on Slice0 DualSubslice1 Thread Dispatcher Port 3"
+             description="The percentage of time in which thread header is ready on slice0 dualsubslice1 thread dispatcher port 3"
+             data_type="float"
+             max_equation="100"
+             equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header01_ready_port3"
+             units="percent"
+             symbol_name="ThreadHeader01ReadyPort3"
+             availability="$DualSubsliceMask 2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="dualsubslice"
+             />
+    <counter name="Thread Header Ready on Slice0 DualSubslice1 Thread Dispatcher Port 0"
+             description="The percentage of time in which thread header is ready on slice0 dualsubslice1 thread dispatcher port 0"
+             data_type="float"
+             max_equation="100"
+             equation="C 4 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header01_ready_port0"
+             units="percent"
+             symbol_name="ThreadHeader01ReadyPort0"
+             availability="$DualSubsliceMask 2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="dualsubslice"
+             />
+    <counter name="Thread Header Ready on Slice0 DualSubslice1 Thread Dispatcher Port 1"
+             description="The percentage of time in which thread header is ready on slice0 dualsubslice1 thread dispatcher port 1"
+             data_type="float"
+             max_equation="100"
+             equation="C 5 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header01_ready_port1"
+             units="percent"
+             symbol_name="ThreadHeader01ReadyPort1"
+             availability="$DualSubsliceMask 2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="dualsubslice"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Non-PS Thread Ready For Dispatch on Slice0 DualSubslice0 Thread Dispatcher"
+             description="The percentage of time in which non-PS thread is ready for dispatch on slice0 dualsubslice0 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="B 5 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="non_ps_thread00_ready_for_dispatch"
+             units="percent"
+             symbol_name="NonPSThread00ReadyForDispatch"
+             availability="$DualSubsliceMask 1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="dualsubslice"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO MEDIA"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="Thread Header Ready on Slice0 DualSubslice0 Thread Dispatcher"
+             description="The percentage of time in which thread header is ready on slice0 dualsubslice0 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="B 6 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header00_ready"
+             units="percent"
+             symbol_name="ThreadHeader00Ready"
+             availability="$DualSubsliceMask 1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="dualsubslice"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU And EM Pipes Active"
+             description="The percentage of time in which EU FPU and EM pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_em_active"
+             units="percent"
+             symbol_name="EuFpuEmActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="EU Thread Occupancy"
+             description="The percentage of time in which hardware threads occupied EUs."
+             data_type="float"
+             max_equation="100"
+             equation="8 A 10 READ FMUL $EuThreadsCount FDIV $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_thread_occupancy"
+             units="percent"
+             symbol_name="EuThreadOccupancy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Non-PS Thread Ready For Dispatch on Slice0 DualSubslice3 Thread Dispatcher"
+             description="The percentage of time in which non-PS thread is ready for dispatch on slice0 dualsubslice3 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="B 2 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="non_ps_thread03_ready_for_dispatch"
+             units="percent"
+             symbol_name="NonPSThread03ReadyForDispatch"
+             availability="$DualSubsliceMask 8 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="dualsubslice"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="Non-PS Thread Ready For Dispatch on Slice0 DualSubslice5 Thread Dispatcher"
+             description="The percentage of time in which non-PS thread is ready for dispatch on slice0 dualsubslice5 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="non_ps_thread05_ready_for_dispatch"
+             units="percent"
+             symbol_name="NonPSThread05ReadyForDispatch"
+             availability="$DualSubsliceMask 32 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="dualsubslice"
+             />
+    <counter name="Non-PS Thread Ready For Dispatch on Slice0 DualSubslice4 Thread Dispatcher"
+             description="The percentage of time in which non-PS thread is ready for dispatch on slice0 dualsubslice4 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="B 1 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="non_ps_thread04_ready_for_dispatch"
+             units="percent"
+             symbol_name="NonPSThread04ReadyForDispatch"
+             availability="$DualSubsliceMask 16 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="dualsubslice"
+             />
+    <counter name="Non-PS Thread Ready For Dispatch on Slice0 DualSubslice1 Thread Dispatcher"
+             description="The percentage of time in which non-PS thread is ready for dispatch on slice0 dualsubslice1 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="B 4 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="non_ps_thread01_ready_for_dispatch"
+             units="percent"
+             symbol_name="NonPSThread01ReadyForDispatch"
+             availability="$DualSubsliceMask 2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="dualsubslice"
+             />
+    <counter name="Thread Header Ready on Slice0 DualSubslice0 Thread Dispatcher Port 3"
+             description="The percentage of time in which thread header is ready on slice0 dualsubslice0 thread dispatcher port 3"
+             data_type="float"
+             max_equation="100"
+             equation="C 3 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header00_ready_port3"
+             units="percent"
+             symbol_name="ThreadHeader00ReadyPort3"
+             availability="$DualSubsliceMask 1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="dualsubslice"
+             />
+    <counter name="Thread Header Ready on Slice0 DualSubslice0 Thread Dispatcher Port 2"
+             description="The percentage of time in which thread header is ready on slice0 dualsubslice0 thread dispatcher port 2"
+             data_type="float"
+             max_equation="100"
+             equation="C 2 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header00_ready_port2"
+             units="percent"
+             symbol_name="ThreadHeader00ReadyPort2"
+             availability="$DualSubsliceMask 1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="dualsubslice"
+             />
+    <counter name="Thread Header Ready on Slice0 DualSubslice0 Thread Dispatcher Port 1"
+             description="The percentage of time in which thread header is ready on slice0 dualsubslice0 thread dispatcher port 1"
+             data_type="float"
+             max_equation="100"
+             equation="C 1 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header00_ready_port1"
+             units="percent"
+             symbol_name="ThreadHeader00ReadyPort1"
+             availability="$DualSubsliceMask 1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="dualsubslice"
+             />
+    <counter name="Thread Header Ready on Slice0 DualSubslice0 Thread Dispatcher Port 0"
+             description="The percentage of time in which thread header is ready on slice0 dualsubslice0 thread dispatcher port 0"
+             data_type="float"
+             max_equation="100"
+             equation="C 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header00_ready_port0"
+             units="percent"
+             symbol_name="ThreadHeader00ReadyPort0"
+             availability="$DualSubsliceMask 1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="dualsubslice"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00000D04" value="0x00000200" />
+        <register type="NOA" address="0x00009840" value="0x00000000" />
+        <register type="NOA" address="0x00009884" value="0x00000000" />
+        <register type="NOA" address="0x00009888" value="0x2611001C" />
+        <register type="NOA" address="0x00009888" value="0x2631001C" />
+        <register type="NOA" address="0x00009888" value="0x2651001C" />
+        <register type="NOA" address="0x00009888" value="0x2671001C" />
+        <register type="NOA" address="0x00009888" value="0x2691001C" />
+        <register type="NOA" address="0x00009888" value="0x26B1001C" />
+        <register type="NOA" address="0x00009888" value="0x1C07C000" />
+        <register type="NOA" address="0x00009888" value="0x24070002" />
+        <register type="NOA" address="0x00009888" value="0x16110103" />
+        <register type="NOA" address="0x00009888" value="0x1C110104" />
+        <register type="NOA" address="0x00009888" value="0x1E110105" />
+        <register type="NOA" address="0x00009888" value="0x02110106" />
+        <register type="NOA" address="0x00009888" value="0x04110107" />
+        <register type="NOA" address="0x00009888" value="0x10110000" />
+        <register type="NOA" address="0x00009888" value="0x0A110000" />
+        <register type="NOA" address="0x00009888" value="0x0E110000" />
+        <register type="NOA" address="0x00009888" value="0x00110000" />
+        <register type="NOA" address="0x00009888" value="0x16128000" />
+        <register type="NOA" address="0x00009888" value="0x1C128000" />
+        <register type="NOA" address="0x00009888" value="0x1E128000" />
+        <register type="NOA" address="0x00009888" value="0x02128000" />
+        <register type="NOA" address="0x00009888" value="0x04128000" />
+        <register type="NOA" address="0x00009888" value="0x1C132000" />
+        <register type="NOA" address="0x00009888" value="0x1E130003" />
+        <register type="NOA" address="0x00009888" value="0x12138000" />
+        <register type="NOA" address="0x00009888" value="0x14138000" />
+        <register type="NOA" address="0x00009888" value="0x14310103" />
+        <register type="NOA" address="0x00009888" value="0x06310104" />
+        <register type="NOA" address="0x00009888" value="0x08310105" />
+        <register type="NOA" address="0x00009888" value="0x0A310106" />
+        <register type="NOA" address="0x00009888" value="0x0C310107" />
+        <register type="NOA" address="0x00009888" value="0x10310000" />
+        <register type="NOA" address="0x00009888" value="0x02310000" />
+        <register type="NOA" address="0x00009888" value="0x04310000" />
+        <register type="NOA" address="0x00009888" value="0x14328000" />
+        <register type="NOA" address="0x00009888" value="0x06328000" />
+        <register type="NOA" address="0x00009888" value="0x08328000" />
+        <register type="NOA" address="0x00009888" value="0x0A328000" />
+        <register type="NOA" address="0x00009888" value="0x0C328000" />
+        <register type="NOA" address="0x00009888" value="0x1C331100" />
+        <register type="NOA" address="0x00009888" value="0x16338000" />
+        <register type="NOA" address="0x00009888" value="0x18338000" />
+        <register type="NOA" address="0x00009888" value="0x1A338000" />
+        <register type="NOA" address="0x00009888" value="0x12510103" />
+        <register type="NOA" address="0x00009888" value="0x10510000" />
+        <register type="NOA" address="0x00009888" value="0x08510000" />
+        <register type="NOA" address="0x00009888" value="0x12528000" />
+        <register type="NOA" address="0x00009888" value="0x1C530800" />
+        <register type="NOA" address="0x00009888" value="0x10710103" />
+        <register type="NOA" address="0x00009888" value="0x08710000" />
+        <register type="NOA" address="0x00009888" value="0x10728000" />
+        <register type="NOA" address="0x00009888" value="0x1C730400" />
+        <register type="NOA" address="0x00009888" value="0x0E910103" />
+        <register type="NOA" address="0x00009888" value="0x10910000" />
+        <register type="NOA" address="0x00009888" value="0x06910000" />
+        <register type="NOA" address="0x00009888" value="0x0E928000" />
+        <register type="NOA" address="0x00009888" value="0x1C930200" />
+        <register type="NOA" address="0x00009888" value="0x00B10103" />
+        <register type="NOA" address="0x00009888" value="0x10B10000" />
+        <register type="NOA" address="0x00009888" value="0x00B28000" />
+        <register type="NOA" address="0x00009888" value="0x10B38000" />
+        <register type="NOA" address="0x00009888" value="0x1C0F8000" />
+        <register type="NOA" address="0x00009888" value="0x10104000" />
+        <register type="NOA" address="0x00009888" value="0x10024000" />
+        <register type="NOA" address="0x00009888" value="0x1C032000" />
+        <register type="NOA" address="0x00009888" value="0x1E034000" />
+        <register type="NOA" address="0x00009888" value="0x18002000" />
+        <register type="NOA" address="0x00009888" value="0x360026CA" />
+        <register type="NOA" address="0x00009888" value="0x38002402" />
+        <register type="NOA" address="0x00009888" value="0x1A004000" />
+        <register type="NOA" address="0x00009888" value="0x1C004000" />
+        <register type="NOA" address="0x00009888" value="0x1E004000" />
+        <register type="NOA" address="0x00009888" value="0x34001200" />
+        <register type="NOA" address="0x00009888" value="0x00014000" />
+        <register type="NOA" address="0x00009888" value="0x1A012000" />
+        <register type="NOA" address="0x00009888" value="0x240582C0" />
+        <register type="NOA" address="0x00009888" value="0x26050002" />
+        <register type="NOA" address="0x00009888" value="0x2205FFA0" />
+        <register type="NOA" address="0x00009888" value="0x24060020" />
+        <register type="NOA" address="0x00009888" value="0x100A8000" />
+        <register type="NOA" address="0x00009888" value="0x120A8000" />
+        <register type="NOA" address="0x00009884" value="0x00000003" />
+        <register type="NOA" address="0x00009888" value="0x41104000" />
+        <register type="NOA" address="0x00009888" value="0x5B105555" />
+        <register type="NOA" address="0x00009888" value="0x5D101415" />
+        <register type="NOA" address="0x00009888" value="0x11148000" />
+        <register type="NOA" address="0x00009888" value="0x1B14FC00" />
+        <register type="NOA" address="0x00009888" value="0x1D140033" />
+        <register type="NOA" address="0x00009888" value="0x13148000" />
+        <register type="NOA" address="0x00009888" value="0x15148000" />
+        <register type="NOA" address="0x00009888" value="0x17148000" />
+        <register type="NOA" address="0x00009888" value="0x4B112000" />
+        <register type="NOA" address="0x00009888" value="0x5F115555" />
+        <register type="NOA" address="0x00009888" value="0x61111415" />
+        <register type="NOA" address="0x00009888" value="0x01128000" />
+        <register type="NOA" address="0x00009888" value="0x0F128000" />
+        <register type="NOA" address="0x00009888" value="0x11128000" />
+        <register type="NOA" address="0x00009888" value="0x13128000" />
+        <register type="NOA" address="0x00009888" value="0x15128000" />
+        <register type="NOA" address="0x00009888" value="0x17128000" />
+        <register type="NOA" address="0x00009888" value="0x1D128000" />
+        <register type="NOA" address="0x00009888" value="0x1F128000" />
+        <register type="NOA" address="0x00009888" value="0x03128000" />
+        <register type="NOA" address="0x00009888" value="0x05128000" />
+        <register type="NOA" address="0x00009888" value="0x07128000" />
+        <register type="NOA" address="0x00009888" value="0x09128000" />
+        <register type="NOA" address="0x00009888" value="0x0B128000" />
+        <register type="NOA" address="0x00009888" value="0x0D128000" />
+        <register type="NOA" address="0x00009888" value="0x47101600" />
+        <register type="NOA" address="0x00009888" value="0x4D100111" />
+        <register type="NOA" address="0x00009888" value="0x4F100006" />
+        <register type="NOA" address="0x00009888" value="0x51101114" />
+        <register type="NOA" address="0x00009888" value="0x53100001" />
+        <register type="NOA" address="0x00009888" value="0x17100000" />
+        <register type="NOA" address="0x00009888" value="0x31100000" />
+        <register type="NOA" address="0x00009888" value="0x55101110" />
+        <register type="NOA" address="0x00009888" value="0x57100001" />
+        <register type="NOA" address="0x00009888" value="0x49101111" />
+        <register type="NOA" address="0x00009888" value="0x4B101111" />
+        <register type="NOA" address="0x00009884" value="0x00000003" />
+        <register type="NOA" address="0x00009888" value="0x65100002" />
+        <register type="NOA" address="0x00009884" value="0x00000000" />
+        <register type="NOA" address="0x00009888" value="0x42000001" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x0000D920" value="0x00000000" />
+        <register type="OA" address="0x0000D900" value="0x00000000" />
+        <register type="OA" address="0x0000D904" value="0xF0800000" />
+        <register type="OA" address="0x0000D910" value="0x00000000" />
+        <register type="OA" address="0x0000D914" value="0xF0800000" />
+        <register type="OA" address="0x0000DC40" value="0x00FF0000" />
+        <register type="OA" address="0x0000D940" value="0x00000002" />
+        <register type="OA" address="0x0000D944" value="0x0000FFFE" />
+        <register type="OA" address="0x0000DC00" value="0x00000002" />
+        <register type="OA" address="0x0000DC04" value="0x0000FFFE" />
+        <register type="OA" address="0x0000D948" value="0x00000002" />
+        <register type="OA" address="0x0000D94C" value="0x0000FFFD" />
+        <register type="OA" address="0x0000DC08" value="0x00000002" />
+        <register type="OA" address="0x0000DC0C" value="0x0000FFFD" />
+        <register type="OA" address="0x0000D950" value="0x00000002" />
+        <register type="OA" address="0x0000D954" value="0x0000FFFB" />
+        <register type="OA" address="0x0000DC10" value="0x00000002" />
+        <register type="OA" address="0x0000DC14" value="0x0000FFFB" />
+        <register type="OA" address="0x0000D958" value="0x00000002" />
+        <register type="OA" address="0x0000D95C" value="0x0000FFF7" />
+        <register type="OA" address="0x0000DC18" value="0x00000002" />
+        <register type="OA" address="0x0000DC1C" value="0x0000FFF7" />
+        <register type="OA" address="0x0000D960" value="0x00000002" />
+        <register type="OA" address="0x0000D964" value="0x0000FFEF" />
+        <register type="OA" address="0x0000DC20" value="0x00000002" />
+        <register type="OA" address="0x0000DC24" value="0x0000FFEF" />
+        <register type="OA" address="0x0000D968" value="0x00000002" />
+        <register type="OA" address="0x0000D96C" value="0x0000FFDF" />
+        <register type="OA" address="0x0000DC28" value="0x00000002" />
+        <register type="OA" address="0x0000DC2C" value="0x0000FFDF" />
+        <register type="OA" address="0x0000D970" value="0x00007800" />
+        <register type="OA" address="0x0000D974" value="0x0000F0FF" />
+        <register type="OA" address="0x0000DC30" value="0x00007800" />
+        <register type="OA" address="0x0000DC34" value="0x0000F0FF" />
+        <register type="OA" address="0x0000D978" value="0x00078000" />
+        <register type="OA" address="0x0000D97C" value="0x00000FFF" />
+        <register type="OA" address="0x0000DC38" value="0x00078000" />
+        <register type="OA" address="0x0000DC3C" value="0x00000FFF" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00008003" />
+    </register_config>
+  </set>
+
+  <set name="TDL_2"
+       mdapi_supported_apis="VK OGL OCL MEDIA IO"
+       underscore_name="tdl_2"
+       hw_config_guid="2a42ff25-99b1-4048-a121-f0664ed42c90"
+       chipset="TGL"
+       symbol_name="TDL_2"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Thread Header Ready on Slice0 DualSubslice5 Thread Dispatcher Port 1"
+             description="The percentage of time in which thread header is ready on slice0 dualsubslice5 thread dispatcher port 1"
+             data_type="float"
+             max_equation="100"
+             equation="C 5 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header05_ready_port1"
+             units="percent"
+             symbol_name="ThreadHeader05ReadyPort1"
+             availability="$DualSubsliceMask 32 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="dualsubslice"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="PS Thread Ready For Dispatch on Slice0 Dualsubslice0 Thread Dispatcher"
+             description="The percentage of time in which PS thread is ready for dispatch on slice0 dualsubslice0 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="B 5 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_thread00_ready_for_dispatch"
+             units="percent"
+             symbol_name="PSThread00ReadyForDispatch"
+             availability="$DualSubsliceMask 1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="dualsubslice"
+             />
+    <counter name="PS Thread Ready For Dispatch on Slice0 Dualsubslice3 Thread Dispatcher"
+             description="The percentage of time in which PS thread is ready for dispatch on slice0 dualsubslice3 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="B 2 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_thread03_ready_for_dispatch"
+             units="percent"
+             symbol_name="PSThread03ReadyForDispatch"
+             availability="$DualSubsliceMask 8 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="dualsubslice"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO MEDIA"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU And EM Pipes Active"
+             description="The percentage of time in which EU FPU and EM pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_em_active"
+             units="percent"
+             symbol_name="EuFpuEmActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Thread Ready For Dispatch on Slice0 Dualsubslice1 Thread Dispatcher"
+             description="The percentage of time in which PS thread is ready for dispatch on slice0 dualsubslice1 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="B 4 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_thread01_ready_for_dispatch"
+             units="percent"
+             symbol_name="PSThread01ReadyForDispatch"
+             availability="$DualSubsliceMask 2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="dualsubslice"
+             />
+    <counter name="PS Thread Ready For Dispatch on Slice0 Dualsubslice2 Thread Dispatcher"
+             description="The percentage of time in which PS thread is ready for dispatch on slice0 dualsubslice2 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="B 3 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_thread02_ready_for_dispatch"
+             units="percent"
+             symbol_name="PSThread02ReadyForDispatch"
+             availability="$DualSubsliceMask 4 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="dualsubslice"
+             />
+    <counter name="EU Thread Occupancy"
+             description="The percentage of time in which hardware threads occupied EUs."
+             data_type="float"
+             max_equation="100"
+             equation="8 A 10 READ FMUL $EuThreadsCount FDIV $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_thread_occupancy"
+             units="percent"
+             symbol_name="EuThreadOccupancy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Thread Header Ready on Slice0 DualSubslice5 Thread Dispatcher Port 3"
+             description="The percentage of time in which thread header is ready on slice0 dualsubslice5 thread dispatcher port 3"
+             data_type="float"
+             max_equation="100"
+             equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header05_ready_port3"
+             units="percent"
+             symbol_name="ThreadHeader05ReadyPort3"
+             availability="$DualSubsliceMask 32 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="dualsubslice"
+             />
+    <counter name="Thread Header Ready on Slice0 DualSubslice5 Thread Dispatcher Port 0"
+             description="The percentage of time in which thread header is ready on slice0 dualsubslice5 thread dispatcher port 0"
+             data_type="float"
+             max_equation="100"
+             equation="C 4 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header05_ready_port0"
+             units="percent"
+             symbol_name="ThreadHeader05ReadyPort0"
+             availability="$DualSubsliceMask 32 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="dualsubslice"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Thread Ready For Dispatch on Slice0 Dualsubslice5 Thread Dispatcher"
+             description="The percentage of time in which PS thread is ready for dispatch on slice0 dualsubslice5 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_thread05_ready_for_dispatch"
+             units="percent"
+             symbol_name="PSThread05ReadyForDispatch"
+             availability="$DualSubsliceMask 32 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="dualsubslice"
+             />
+    <counter name="Thread Header Ready on Slice0 DualSubslice5 Thread Dispatcher"
+             description="The percentage of time in which thread header is ready on slice0 dualsubslice5 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="B 6 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header05_ready"
+             units="percent"
+             symbol_name="ThreadHeader05Ready"
+             availability="$DualSubsliceMask 32 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="dualsubslice"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Thread Header Ready on Slice0 DualSubslice5 Thread Dispatcher Port 2"
+             description="The percentage of time in which thread header is ready on slice0 dualsubslice5 thread dispatcher port 2"
+             data_type="float"
+             max_equation="100"
+             equation="C 6 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header05_ready_port2"
+             units="percent"
+             symbol_name="ThreadHeader05ReadyPort2"
+             availability="$DualSubsliceMask 32 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="dualsubslice"
+             />
+    <counter name="PS Thread Ready For Dispatch on Slice0 Dualsubslice4 Thread Dispatcher"
+             description="The percentage of time in which PS thread is ready for dispatch on slice0 dualsubslice4 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="B 1 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_thread04_ready_for_dispatch"
+             units="percent"
+             symbol_name="PSThread04ReadyForDispatch"
+             availability="$DualSubsliceMask 16 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="dualsubslice"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00000D04" value="0x00000200" />
+        <register type="NOA" address="0x00009840" value="0x00000000" />
+        <register type="NOA" address="0x00009884" value="0x00000000" />
+        <register type="NOA" address="0x00009888" value="0x24110340" />
+        <register type="NOA" address="0x00009888" value="0x24310340" />
+        <register type="NOA" address="0x00009888" value="0x24510340" />
+        <register type="NOA" address="0x00009888" value="0x24710340" />
+        <register type="NOA" address="0x00009888" value="0x24910340" />
+        <register type="NOA" address="0x00009888" value="0x24B10340" />
+        <register type="NOA" address="0x00009888" value="0x26B1001C" />
+        <register type="NOA" address="0x00009888" value="0x1C07C000" />
+        <register type="NOA" address="0x00009888" value="0x2407002B" />
+        <register type="NOA" address="0x00009888" value="0x2207FF00" />
+        <register type="NOA" address="0x00009888" value="0x021100F3" />
+        <register type="NOA" address="0x00009888" value="0x041100F2" />
+        <register type="NOA" address="0x00009888" value="0x10110000" />
+        <register type="NOA" address="0x00009888" value="0x00110000" />
+        <register type="NOA" address="0x00009888" value="0x02128000" />
+        <register type="NOA" address="0x00009888" value="0x04128000" />
+        <register type="NOA" address="0x00009888" value="0x12138000" />
+        <register type="NOA" address="0x00009888" value="0x14138000" />
+        <register type="NOA" address="0x00009888" value="0x1C3100F3" />
+        <register type="NOA" address="0x00009888" value="0x1E3100F2" />
+        <register type="NOA" address="0x00009888" value="0x10310000" />
+        <register type="NOA" address="0x00009888" value="0x0E310000" />
+        <register type="NOA" address="0x00009888" value="0x1C328000" />
+        <register type="NOA" address="0x00009888" value="0x1E328000" />
+        <register type="NOA" address="0x00009888" value="0x1E330003" />
+        <register type="NOA" address="0x00009888" value="0x185100F3" />
+        <register type="NOA" address="0x00009888" value="0x1A5100F2" />
+        <register type="NOA" address="0x00009888" value="0x10510000" />
+        <register type="NOA" address="0x00009888" value="0x0C510000" />
+        <register type="NOA" address="0x00009888" value="0x18528000" />
+        <register type="NOA" address="0x00009888" value="0x1A528000" />
+        <register type="NOA" address="0x00009888" value="0x1C53C000" />
+        <register type="NOA" address="0x00009888" value="0x147100F3" />
+        <register type="NOA" address="0x00009888" value="0x167100F2" />
+        <register type="NOA" address="0x00009888" value="0x10710000" />
+        <register type="NOA" address="0x00009888" value="0x0A710000" />
+        <register type="NOA" address="0x00009888" value="0x14728000" />
+        <register type="NOA" address="0x00009888" value="0x16728000" />
+        <register type="NOA" address="0x00009888" value="0x1C733000" />
+        <register type="NOA" address="0x00009888" value="0x109100F3" />
+        <register type="NOA" address="0x00009888" value="0x129100F2" />
+        <register type="NOA" address="0x00009888" value="0x08910000" />
+        <register type="NOA" address="0x00009888" value="0x10928000" />
+        <register type="NOA" address="0x00009888" value="0x12928000" />
+        <register type="NOA" address="0x00009888" value="0x1C930C00" />
+        <register type="NOA" address="0x00009888" value="0x00B100F3" />
+        <register type="NOA" address="0x00009888" value="0x0EB100F2" />
+        <register type="NOA" address="0x00009888" value="0x06B10104" />
+        <register type="NOA" address="0x00009888" value="0x08B10105" />
+        <register type="NOA" address="0x00009888" value="0x0AB10106" />
+        <register type="NOA" address="0x00009888" value="0x0CB10107" />
+        <register type="NOA" address="0x00009888" value="0x10B10000" />
+        <register type="NOA" address="0x00009888" value="0x02B10000" />
+        <register type="NOA" address="0x00009888" value="0x04B10000" />
+        <register type="NOA" address="0x00009888" value="0x00B28000" />
+        <register type="NOA" address="0x00009888" value="0x0EB28000" />
+        <register type="NOA" address="0x00009888" value="0x06B28000" />
+        <register type="NOA" address="0x00009888" value="0x08B28000" />
+        <register type="NOA" address="0x00009888" value="0x0AB28000" />
+        <register type="NOA" address="0x00009888" value="0x0CB28000" />
+        <register type="NOA" address="0x00009888" value="0x10B38000" />
+        <register type="NOA" address="0x00009888" value="0x1CB30300" />
+        <register type="NOA" address="0x00009888" value="0x16B38000" />
+        <register type="NOA" address="0x00009888" value="0x18B38000" />
+        <register type="NOA" address="0x00009888" value="0x1AB38000" />
+        <register type="NOA" address="0x00009888" value="0x1E0F0028" />
+        <register type="NOA" address="0x00009888" value="0x14104000" />
+        <register type="NOA" address="0x00009888" value="0x16104000" />
+        <register type="NOA" address="0x00009888" value="0x2C024000" />
+        <register type="NOA" address="0x00009888" value="0x2E020001" />
+        <register type="NOA" address="0x00009888" value="0x2A03A500" />
+        <register type="NOA" address="0x00009888" value="0x18002000" />
+        <register type="NOA" address="0x00009888" value="0x36003249" />
+        <register type="NOA" address="0x00009888" value="0x380024DB" />
+        <register type="NOA" address="0x00009888" value="0x1A004000" />
+        <register type="NOA" address="0x00009888" value="0x1C004000" />
+        <register type="NOA" address="0x00009888" value="0x1E002000" />
+        <register type="NOA" address="0x00009888" value="0x34000900" />
+        <register type="NOA" address="0x00009888" value="0x00014000" />
+        <register type="NOA" address="0x00009888" value="0x1A012000" />
+        <register type="NOA" address="0x00009888" value="0x1C012000" />
+        <register type="NOA" address="0x00009888" value="0x1E012000" />
+        <register type="NOA" address="0x00009888" value="0x06014000" />
+        <register type="NOA" address="0x00009888" value="0x08014000" />
+        <register type="NOA" address="0x00009888" value="0x0A014000" />
+        <register type="NOA" address="0x00009888" value="0x18012000" />
+        <register type="NOA" address="0x00009888" value="0x2405C000" />
+        <register type="NOA" address="0x00009888" value="0x26050003" />
+        <register type="NOA" address="0x00009888" value="0x220500A0" />
+        <register type="NOA" address="0x00009888" value="0x24062800" />
+        <register type="NOA" address="0x00009888" value="0x140A8000" />
+        <register type="NOA" address="0x00009888" value="0x160A8000" />
+        <register type="NOA" address="0x00009888" value="0x180A8000" />
+        <register type="NOA" address="0x00009888" value="0x1A0A8000" />
+        <register type="NOA" address="0x00009884" value="0x00000003" />
+        <register type="NOA" address="0x00009888" value="0x41104000" />
+        <register type="NOA" address="0x00009888" value="0x5B105555" />
+        <register type="NOA" address="0x00009888" value="0x5D101555" />
+        <register type="NOA" address="0x00009888" value="0x11148000" />
+        <register type="NOA" address="0x00009888" value="0x1B14FC00" />
+        <register type="NOA" address="0x00009888" value="0x1D14003F" />
+        <register type="NOA" address="0x00009888" value="0x13148000" />
+        <register type="NOA" address="0x00009888" value="0x15148000" />
+        <register type="NOA" address="0x00009888" value="0x17148000" />
+        <register type="NOA" address="0x00009888" value="0x4B112000" />
+        <register type="NOA" address="0x00009888" value="0x5F115555" />
+        <register type="NOA" address="0x00009888" value="0x61111555" />
+        <register type="NOA" address="0x00009888" value="0x01128000" />
+        <register type="NOA" address="0x00009888" value="0x0F128000" />
+        <register type="NOA" address="0x00009888" value="0x11128000" />
+        <register type="NOA" address="0x00009888" value="0x13128000" />
+        <register type="NOA" address="0x00009888" value="0x15128000" />
+        <register type="NOA" address="0x00009888" value="0x17128000" />
+        <register type="NOA" address="0x00009888" value="0x19128000" />
+        <register type="NOA" address="0x00009888" value="0x1B128000" />
+        <register type="NOA" address="0x00009888" value="0x1D128000" />
+        <register type="NOA" address="0x00009888" value="0x1F128000" />
+        <register type="NOA" address="0x00009888" value="0x03128000" />
+        <register type="NOA" address="0x00009888" value="0x05128000" />
+        <register type="NOA" address="0x00009888" value="0x07128000" />
+        <register type="NOA" address="0x00009888" value="0x09128000" />
+        <register type="NOA" address="0x00009888" value="0x0B128000" />
+        <register type="NOA" address="0x00009888" value="0x0D128000" />
+        <register type="NOA" address="0x00009888" value="0x47101600" />
+        <register type="NOA" address="0x00009888" value="0x4D100606" />
+        <register type="NOA" address="0x00009888" value="0x4F100606" />
+        <register type="NOA" address="0x00009888" value="0x51100006" />
+        <register type="NOA" address="0x00009888" value="0x53100400" />
+        <register type="NOA" address="0x00009888" value="0x55101114" />
+        <register type="NOA" address="0x00009888" value="0x17100000" />
+        <register type="NOA" address="0x00009888" value="0x31100000" />
+        <register type="NOA" address="0x00009888" value="0x57100001" />
+        <register type="NOA" address="0x00009888" value="0x49100111" />
+        <register type="NOA" address="0x00009888" value="0x4B100606" />
+        <register type="NOA" address="0x00009884" value="0x00000003" />
+        <register type="NOA" address="0x00009888" value="0x65100002" />
+        <register type="NOA" address="0x00009884" value="0x00000000" />
+        <register type="NOA" address="0x00009888" value="0x42000001" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x0000D920" value="0x00000000" />
+        <register type="OA" address="0x0000D900" value="0x00000000" />
+        <register type="OA" address="0x0000D904" value="0xF0800000" />
+        <register type="OA" address="0x0000D910" value="0x00000000" />
+        <register type="OA" address="0x0000D914" value="0x70800000" />
+        <register type="OA" address="0x0000DC40" value="0x007F0000" />
+        <register type="OA" address="0x0000D940" value="0x00000000" />
+        <register type="OA" address="0x0000D944" value="0x0000FFFC" />
+        <register type="OA" address="0x0000DC00" value="0x00000000" />
+        <register type="OA" address="0x0000DC04" value="0x0000FFFC" />
+        <register type="OA" address="0x0000D948" value="0x00000000" />
+        <register type="OA" address="0x0000D94C" value="0x0000FFF3" />
+        <register type="OA" address="0x0000DC08" value="0x00000000" />
+        <register type="OA" address="0x0000DC0C" value="0x0000FFF3" />
+        <register type="OA" address="0x0000D950" value="0x00000000" />
+        <register type="OA" address="0x0000D954" value="0x0000FFCF" />
+        <register type="OA" address="0x0000DC10" value="0x00000000" />
+        <register type="OA" address="0x0000DC14" value="0x0000FFCF" />
+        <register type="OA" address="0x0000D958" value="0x00000000" />
+        <register type="OA" address="0x0000D95C" value="0x0000FF3F" />
+        <register type="OA" address="0x0000DC18" value="0x00000000" />
+        <register type="OA" address="0x0000DC1C" value="0x0000FF3F" />
+        <register type="OA" address="0x0000D960" value="0x00000000" />
+        <register type="OA" address="0x0000D964" value="0x0000FCFF" />
+        <register type="OA" address="0x0000DC20" value="0x00000000" />
+        <register type="OA" address="0x0000DC24" value="0x0000FCFF" />
+        <register type="OA" address="0x0000D968" value="0x00000000" />
+        <register type="OA" address="0x0000D96C" value="0x0000F3FF" />
+        <register type="OA" address="0x0000DC28" value="0x00000000" />
+        <register type="OA" address="0x0000DC2C" value="0x0000F3FF" />
+        <register type="OA" address="0x0000D970" value="0x00078000" />
+        <register type="OA" address="0x0000D974" value="0x00000FFF" />
+        <register type="OA" address="0x0000DC30" value="0x00078000" />
+        <register type="OA" address="0x0000DC34" value="0x00000FFF" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00008003" />
+    </register_config>
+  </set>
+
+  <set name="TDL_3"
+       mdapi_supported_apis="VK OGL OCL MEDIA IO"
+       underscore_name="tdl_3"
+       hw_config_guid="b763fa13-834e-4468-bba6-5f0d40db9813"
+       chipset="TGL"
+       symbol_name="TDL_3"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Thread Header Ready on Slice0 DualSubslice3 Thread Dispatcher"
+             description="The percentage of time in which thread header is ready on slice0 dualsubslice3 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="B 1 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header03_ready"
+             units="percent"
+             symbol_name="ThreadHeader03Ready"
+             availability="$DualSubsliceMask 8 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="dualsubslice"
+             />
+    <counter name="Thread Header Ready on Slice0 DualSubslice3 Thread Dispatcher Port 3"
+             description="The percentage of time in which thread header is ready on slice0 dualsubslice3 thread dispatcher port 3"
+             data_type="float"
+             max_equation="100"
+             equation="C 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header03_ready_port3"
+             units="percent"
+             symbol_name="ThreadHeader03ReadyPort3"
+             availability="$DualSubsliceMask 8 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="dualsubslice"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="Thread Header Ready on Slice0 DualSubslice3 Thread Dispatcher Port 0"
+             description="The percentage of time in which thread header is ready on slice0 dualsubslice3 thread dispatcher port 0"
+             data_type="float"
+             max_equation="100"
+             equation="C 3 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header03_ready_port0"
+             units="percent"
+             symbol_name="ThreadHeader03ReadyPort0"
+             availability="$DualSubsliceMask 8 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="dualsubslice"
+             />
+    <counter name="Thread Header Ready on Slice0 DualSubslice3 Thread Dispatcher Port 1"
+             description="The percentage of time in which thread header is ready on slice0 dualsubslice3 thread dispatcher port 1"
+             data_type="float"
+             max_equation="100"
+             equation="C 2 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header03_ready_port1"
+             units="percent"
+             symbol_name="ThreadHeader03ReadyPort1"
+             availability="$DualSubsliceMask 8 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="dualsubslice"
+             />
+    <counter name="Thread Header Ready on Slice0 DualSubslice3 Thread Dispatcher Port 2"
+             description="The percentage of time in which thread header is ready on slice0 dualsubslice3 thread dispatcher port 2"
+             data_type="float"
+             max_equation="100"
+             equation="C 1 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header03_ready_port2"
+             units="percent"
+             symbol_name="ThreadHeader03ReadyPort2"
+             availability="$DualSubsliceMask 8 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="dualsubslice"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Thread Header Ready on Slice0 DualSubslice4 Thread Dispatcher Port 3"
+             description="The percentage of time in which thread header is ready on slice0 dualsubslice4 thread dispatcher port 3"
+             data_type="float"
+             max_equation="100"
+             equation="B 4 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header04_ready_port3"
+             units="percent"
+             symbol_name="ThreadHeader04ReadyPort3"
+             availability="$DualSubsliceMask 16 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="dualsubslice"
+             />
+    <counter name="Thread Header Ready on Slice0 DualSubslice4 Thread Dispatcher Port 2"
+             description="The percentage of time in which thread header is ready on slice0 dualsubslice4 thread dispatcher port 2"
+             data_type="float"
+             max_equation="100"
+             equation="B 5 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header04_ready_port2"
+             units="percent"
+             symbol_name="ThreadHeader04ReadyPort2"
+             availability="$DualSubsliceMask 16 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="dualsubslice"
+             />
+    <counter name="Thread Header Ready on Slice0 DualSubslice4 Thread Dispatcher Port 1"
+             description="The percentage of time in which thread header is ready on slice0 dualsubslice4 thread dispatcher port 1"
+             data_type="float"
+             max_equation="100"
+             equation="B 6 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header04_ready_port1"
+             units="percent"
+             symbol_name="ThreadHeader04ReadyPort1"
+             availability="$DualSubsliceMask 16 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="dualsubslice"
+             />
+    <counter name="Thread Header Ready on Slice0 DualSubslice4 Thread Dispatcher Port 0"
+             description="The percentage of time in which thread header is ready on slice0 dualsubslice4 thread dispatcher port 0"
+             data_type="float"
+             max_equation="100"
+             equation="B 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header04_ready_port0"
+             units="percent"
+             symbol_name="ThreadHeader04ReadyPort0"
+             availability="$DualSubsliceMask 16 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="dualsubslice"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO MEDIA"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="Thread Header Ready on Slice0 DualSubslice4 Thread Dispatcher"
+             description="The percentage of time in which thread header is ready on slice0 dualsubslice4 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="B 2 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header04_ready"
+             units="percent"
+             symbol_name="ThreadHeader04Ready"
+             availability="$DualSubsliceMask 16 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="dualsubslice"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Thread Header Ready on Slice0 DualSubslice2 Thread Dispatcher Port 1"
+             description="The percentage of time in which thread header is ready on slice0 dualsubslice2 thread dispatcher port 1"
+             data_type="float"
+             max_equation="100"
+             equation="C 6 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header02_ready_port1"
+             units="percent"
+             symbol_name="ThreadHeader02ReadyPort1"
+             availability="$DualSubsliceMask 4 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="dualsubslice"
+             />
+    <counter name="Thread Header Ready on Slice0 DualSubslice2 Thread Dispatcher Port 0"
+             description="The percentage of time in which thread header is ready on slice0 dualsubslice2 thread dispatcher port 0"
+             data_type="float"
+             max_equation="100"
+             equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header02_ready_port0"
+             units="percent"
+             symbol_name="ThreadHeader02ReadyPort0"
+             availability="$DualSubsliceMask 4 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="dualsubslice"
+             />
+    <counter name="Thread Header Ready on Slice0 DualSubslice2 Thread Dispatcher Port 3"
+             description="The percentage of time in which thread header is ready on slice0 dualsubslice2 thread dispatcher port 3"
+             data_type="float"
+             max_equation="100"
+             equation="C 4 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header02_ready_port3"
+             units="percent"
+             symbol_name="ThreadHeader02ReadyPort3"
+             availability="$DualSubsliceMask 4 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="dualsubslice"
+             />
+    <counter name="Thread Header Ready on Slice0 DualSubslice2 Thread Dispatcher Port 2"
+             description="The percentage of time in which thread header is ready on slice0 dualsubslice2 thread dispatcher port 2"
+             data_type="float"
+             max_equation="100"
+             equation="C 5 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header02_ready_port2"
+             units="percent"
+             symbol_name="ThreadHeader02ReadyPort2"
+             availability="$DualSubsliceMask 4 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="dualsubslice"
+             />
+    <counter name="EU FPU And EM Pipes Active"
+             description="The percentage of time in which EU FPU and EM pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_em_active"
+             units="percent"
+             symbol_name="EuFpuEmActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="EU Thread Occupancy"
+             description="The percentage of time in which hardware threads occupied EUs."
+             data_type="float"
+             max_equation="100"
+             equation="8 A 10 READ FMUL $EuThreadsCount FDIV $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_thread_occupancy"
+             units="percent"
+             symbol_name="EuThreadOccupancy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="Thread Header Ready on Slice0 DualSubslice2 Thread Dispatcher"
+             description="The percentage of time in which thread header is ready on slice0 dualsubslice2 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header02_ready"
+             units="percent"
+             symbol_name="ThreadHeader02Ready"
+             availability="$DualSubsliceMask 4 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="dualsubslice"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00000D04" value="0x00000200" />
+        <register type="NOA" address="0x00009840" value="0x00000000" />
+        <register type="NOA" address="0x00009884" value="0x00000000" />
+        <register type="NOA" address="0x00009888" value="0x2651001C" />
+        <register type="NOA" address="0x00009888" value="0x2671001C" />
+        <register type="NOA" address="0x00009888" value="0x2691001C" />
+        <register type="NOA" address="0x00009888" value="0x24072A80" />
+        <register type="NOA" address="0x00009888" value="0x06510107" />
+        <register type="NOA" address="0x00009888" value="0x08510106" />
+        <register type="NOA" address="0x00009888" value="0x0A510105" />
+        <register type="NOA" address="0x00009888" value="0x0C510104" />
+        <register type="NOA" address="0x00009888" value="0x10510000" />
+        <register type="NOA" address="0x00009888" value="0x02510000" />
+        <register type="NOA" address="0x00009888" value="0x04510000" />
+        <register type="NOA" address="0x00009888" value="0x06528000" />
+        <register type="NOA" address="0x00009888" value="0x08528000" />
+        <register type="NOA" address="0x00009888" value="0x0A528000" />
+        <register type="NOA" address="0x00009888" value="0x0C528000" />
+        <register type="NOA" address="0x00009888" value="0x16538000" />
+        <register type="NOA" address="0x00009888" value="0x18538000" />
+        <register type="NOA" address="0x00009888" value="0x1A538000" />
+        <register type="NOA" address="0x00009888" value="0x1C530100" />
+        <register type="NOA" address="0x00009888" value="0x1C710107" />
+        <register type="NOA" address="0x00009888" value="0x1E710106" />
+        <register type="NOA" address="0x00009888" value="0x02710105" />
+        <register type="NOA" address="0x00009888" value="0x04710104" />
+        <register type="NOA" address="0x00009888" value="0x10710000" />
+        <register type="NOA" address="0x00009888" value="0x0E710000" />
+        <register type="NOA" address="0x00009888" value="0x00710000" />
+        <register type="NOA" address="0x00009888" value="0x1C728000" />
+        <register type="NOA" address="0x00009888" value="0x1E728000" />
+        <register type="NOA" address="0x00009888" value="0x02728000" />
+        <register type="NOA" address="0x00009888" value="0x04728000" />
+        <register type="NOA" address="0x00009888" value="0x1E730003" />
+        <register type="NOA" address="0x00009888" value="0x12738000" />
+        <register type="NOA" address="0x00009888" value="0x14738000" />
+        <register type="NOA" address="0x00009888" value="0x14910107" />
+        <register type="NOA" address="0x00009888" value="0x16910106" />
+        <register type="NOA" address="0x00009888" value="0x18910105" />
+        <register type="NOA" address="0x00009888" value="0x1A910104" />
+        <register type="NOA" address="0x00009888" value="0x10910000" />
+        <register type="NOA" address="0x00009888" value="0x0A910000" />
+        <register type="NOA" address="0x00009888" value="0x0C910000" />
+        <register type="NOA" address="0x00009888" value="0x14928000" />
+        <register type="NOA" address="0x00009888" value="0x16928000" />
+        <register type="NOA" address="0x00009888" value="0x18928000" />
+        <register type="NOA" address="0x00009888" value="0x1A928000" />
+        <register type="NOA" address="0x00009888" value="0x1C93F000" />
+        <register type="NOA" address="0x00009888" value="0x1E0F2800" />
+        <register type="NOA" address="0x00009888" value="0x1C0F000A" />
+        <register type="NOA" address="0x00009888" value="0x1C104000" />
+        <register type="NOA" address="0x00009888" value="0x1E104000" />
+        <register type="NOA" address="0x00009888" value="0x02104000" />
+        <register type="NOA" address="0x00009888" value="0x04104000" />
+        <register type="NOA" address="0x00009888" value="0x2E020140" />
+        <register type="NOA" address="0x00009888" value="0x02024000" />
+        <register type="NOA" address="0x00009888" value="0x04024000" />
+        <register type="NOA" address="0x00009888" value="0x2C030005" />
+        <register type="NOA" address="0x00009888" value="0x02034000" />
+        <register type="NOA" address="0x00009888" value="0x04034000" />
+        <register type="NOA" address="0x00009888" value="0x06038000" />
+        <register type="NOA" address="0x00009888" value="0x08038000" />
+        <register type="NOA" address="0x00009888" value="0x0A038000" />
+        <register type="NOA" address="0x00009888" value="0x18034000" />
+        <register type="NOA" address="0x00009888" value="0x36001003" />
+        <register type="NOA" address="0x00009888" value="0x38003649" />
+        <register type="NOA" address="0x00009888" value="0x1A006000" />
+        <register type="NOA" address="0x00009888" value="0x1C006000" />
+        <register type="NOA" address="0x00009888" value="0x1E006000" />
+        <register type="NOA" address="0x00009888" value="0x34001B00" />
+        <register type="NOA" address="0x00009888" value="0x2A015500" />
+        <register type="NOA" address="0x00009888" value="0x2206AA00" />
+        <register type="NOA" address="0x00009888" value="0x1C0A8000" />
+        <register type="NOA" address="0x00009888" value="0x1E0A8000" />
+        <register type="NOA" address="0x00009888" value="0x020A8000" />
+        <register type="NOA" address="0x00009888" value="0x040A8000" />
+        <register type="NOA" address="0x00009888" value="0x060A8000" />
+        <register type="NOA" address="0x00009888" value="0x080A8000" />
+        <register type="NOA" address="0x00009888" value="0x0A0A8000" />
+        <register type="NOA" address="0x00009888" value="0x0C0A8000" />
+        <register type="NOA" address="0x00009884" value="0x00000003" />
+        <register type="NOA" address="0x00009888" value="0x5D101554" />
+        <register type="NOA" address="0x00009888" value="0x5B100555" />
+        <register type="NOA" address="0x00009888" value="0x1D14003F" />
+        <register type="NOA" address="0x00009888" value="0x13148000" />
+        <register type="NOA" address="0x00009888" value="0x15148000" />
+        <register type="NOA" address="0x00009888" value="0x17148000" />
+        <register type="NOA" address="0x00009888" value="0x1B141C00" />
+        <register type="NOA" address="0x00009888" value="0x61111554" />
+        <register type="NOA" address="0x00009888" value="0x5F110555" />
+        <register type="NOA" address="0x00009888" value="0x15128000" />
+        <register type="NOA" address="0x00009888" value="0x17128000" />
+        <register type="NOA" address="0x00009888" value="0x19128000" />
+        <register type="NOA" address="0x00009888" value="0x1B128000" />
+        <register type="NOA" address="0x00009888" value="0x1D128000" />
+        <register type="NOA" address="0x00009888" value="0x1F128000" />
+        <register type="NOA" address="0x00009888" value="0x03128000" />
+        <register type="NOA" address="0x00009888" value="0x05128000" />
+        <register type="NOA" address="0x00009888" value="0x07128000" />
+        <register type="NOA" address="0x00009888" value="0x09128000" />
+        <register type="NOA" address="0x00009888" value="0x0B128000" />
+        <register type="NOA" address="0x00009888" value="0x0D128000" />
+        <register type="NOA" address="0x00009888" value="0x51100600" />
+        <register type="NOA" address="0x00009888" value="0x53100606" />
+        <register type="NOA" address="0x00009888" value="0x55100006" />
+        <register type="NOA" address="0x00009888" value="0x17100000" />
+        <register type="NOA" address="0x00009888" value="0x31100000" />
+        <register type="NOA" address="0x00009888" value="0x57100000" />
+        <register type="NOA" address="0x00009888" value="0x47100000" />
+        <register type="NOA" address="0x00009888" value="0x49100000" />
+        <register type="NOA" address="0x00009888" value="0x4B100404" />
+        <register type="NOA" address="0x00009888" value="0x4D100404" />
+        <register type="NOA" address="0x00009884" value="0x00000003" />
+        <register type="NOA" address="0x00009888" value="0x65100002" />
+        <register type="NOA" address="0x00009884" value="0x00000000" />
+        <register type="NOA" address="0x00009888" value="0x42000001" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x0000D920" value="0x00000000" />
+        <register type="OA" address="0x0000D900" value="0x00000000" />
+        <register type="OA" address="0x0000D904" value="0x70800000" />
+        <register type="OA" address="0x0000D910" value="0x00000000" />
+        <register type="OA" address="0x0000D914" value="0x00800000" />
+        <register type="OA" address="0x0000DC40" value="0x00070000" />
+        <register type="OA" address="0x0000D940" value="0x00078000" />
+        <register type="OA" address="0x0000D944" value="0x00000FFF" />
+        <register type="OA" address="0x0000DC00" value="0x00078000" />
+        <register type="OA" address="0x0000DC04" value="0x00000FFF" />
+        <register type="OA" address="0x0000D948" value="0x00007800" />
+        <register type="OA" address="0x0000D94C" value="0x0000F0FF" />
+        <register type="OA" address="0x0000DC08" value="0x00007800" />
+        <register type="OA" address="0x0000DC0C" value="0x0000F0FF" />
+        <register type="OA" address="0x0000D950" value="0x00000780" />
+        <register type="OA" address="0x0000D954" value="0x0000FF0F" />
+        <register type="OA" address="0x0000DC10" value="0x00000780" />
+        <register type="OA" address="0x0000DC14" value="0x0000FF0F" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00008003" />
+    </register_config>
+  </set>
+
+  <set name="GpuBusyness"
+       mdapi_supported_apis="VK OGL OCL MEDIA IO"
+       underscore_name="gpu_busyness"
+       hw_config_guid="cc935a3e-8d96-4b47-bc46-3d84247e9a3a"
+       chipset="TGL"
+       symbol_name="GpuBusyness"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Vebox Ring Busy"
+             description="The percentage of time when vebox command streamer was busy."
+             data_type="float"
+             max_equation="100"
+             equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vebox_busy"
+             units="percent"
+             symbol_name="VeboxBusy"
+             semantic_type="duration"
+             mdapi_supported_apis="IO"
+             mdapi_usage_flags="System Frame Batch"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Any Engine Busy"
+             description="The percentage of time when any command streamer was busy."
+             data_type="float"
+             max_equation="100"
+             equation="B 1 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="any_engine_busy"
+             units="percent"
+             symbol_name="AnyEngineBusy"
+             semantic_type="duration"
+             mdapi_supported_apis="IO"
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Compute Ring Busy"
+             description="The percentage of time when compute command streamer was busy."
+             data_type="float"
+             max_equation="100"
+             equation="C 3 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="compute_busy"
+             units="percent"
+             symbol_name="ComputeBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="System Frame Batch"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Render Ring Busy"
+             description="The percentage of time when render command streamer was busy."
+             data_type="float"
+             max_equation="100"
+             equation="C 6 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="render_busy"
+             units="percent"
+             symbol_name="RenderBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="System Frame Batch"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL OCL IO MEDIA"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="Posh Ring Busy"
+             description="The percentage of time when posh command streamer was busy."
+             data_type="float"
+             max_equation="100"
+             equation="C 5 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="posh_engine_busy"
+             units="percent"
+             symbol_name="PoshEngineBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="System Frame Batch"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Vdbox1 Ring Busy"
+             description="The percentage of time when Vdbox1 command streamer was busy."
+             data_type="float"
+             max_equation="100"
+             equation="C 2 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vdbox1_busy"
+             units="percent"
+             symbol_name="Vdbox1Busy"
+             semantic_type="duration"
+             mdapi_supported_apis="IO"
+             mdapi_usage_flags="System Frame Batch"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU And EM Pipes Active"
+             description="The percentage of time in which EU FPU and EM pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_em_active"
+             units="percent"
+             symbol_name="EuFpuEmActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Render and compute engines are simultaneously busy"
+             description="The percentage of time when render and compute engines are simultaneously busy"
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="render_and_compute_busy"
+             units="percent"
+             symbol_name="RenderAndComputeBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Vdbox0 Ring Busy"
+             description="The percentage of time when Vdbox0 command streamer was busy."
+             data_type="float"
+             max_equation="100"
+             equation="C 1 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vdbox0_busy"
+             units="percent"
+             symbol_name="Vdbox0Busy"
+             semantic_type="duration"
+             mdapi_supported_apis="IO"
+             mdapi_usage_flags="System Frame Batch"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="EU Thread Occupancy"
+             description="The percentage of time in which hardware threads occupied EUs."
+             data_type="float"
+             max_equation="100"
+             equation="8 A 10 READ FMUL $EuThreadsCount FDIV $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_thread_occupancy"
+             units="percent"
+             symbol_name="EuThreadOccupancy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="VK OGL IO"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="Blitter Ring Busy"
+             description="The percentage of time when blitter command streamer was busy."
+             data_type="float"
+             max_equation="100"
+             equation="C 4 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="blitter_busy"
+             units="percent"
+             symbol_name="BlitterBusy"
+             semantic_type="duration"
+             mdapi_supported_apis="IO"
+             mdapi_usage_flags="System Frame Batch"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00000D04" value="0x00000200" />
+        <register type="NOA" address="0x00009840" value="0x00000000" />
+        <register type="NOA" address="0x00009884" value="0x00000000" />
+        <register type="NOA" address="0x00009888" value="0x0E0E1200" />
+        <register type="NOA" address="0x00009888" value="0x220E0009" />
+        <register type="NOA" address="0x00009888" value="0x0E101200" />
+        <register type="NOA" address="0x00009888" value="0x040E0043" />
+        <register type="NOA" address="0x00009888" value="0x0A0E00B3" />
+        <register type="NOA" address="0x00009888" value="0x180E0000" />
+        <register type="NOA" address="0x00009888" value="0x0C0E0000" />
+        <register type="NOA" address="0x00009888" value="0x1C0F0104" />
+        <register type="NOA" address="0x00009888" value="0x08100053" />
+        <register type="NOA" address="0x00009888" value="0x20100000" />
+        <register type="NOA" address="0x00009888" value="0x04104000" />
+        <register type="NOA" address="0x00009888" value="0x0A104000" />
+        <register type="NOA" address="0x00009888" value="0x04024000" />
+        <register type="NOA" address="0x00009888" value="0x08024000" />
+        <register type="NOA" address="0x00009888" value="0x0A024000" />
+        <register type="NOA" address="0x00009888" value="0x04034000" />
+        <register type="NOA" address="0x00009888" value="0x08034000" />
+        <register type="NOA" address="0x00009888" value="0x0A034000" />
+        <register type="NOA" address="0x00009888" value="0x1C006000" />
+        <register type="NOA" address="0x00009888" value="0x34001B00" />
+        <register type="NOA" address="0x00009888" value="0x040A8000" />
+        <register type="NOA" address="0x00009888" value="0x080A8000" />
+        <register type="NOA" address="0x00009888" value="0x0A0A8000" />
+        <register type="NOA" address="0x00009884" value="0x00000003" />
+        <register type="NOA" address="0x00009888" value="0x15102400" />
+        <register type="NOA" address="0x00009888" value="0x230B0120" />
+        <register type="NOA" address="0x00009888" value="0x15182400" />
+        <register type="NOA" address="0x00009888" value="0x232B0120" />
+        <register type="NOA" address="0x00009888" value="0x17100023" />
+        <register type="NOA" address="0x00009888" value="0x11100000" />
+        <register type="NOA" address="0x00009888" value="0x5D101000" />
+        <register type="NOA" address="0x00009888" value="0x5B100545" />
+        <register type="NOA" address="0x00009888" value="0x15148000" />
+        <register type="NOA" address="0x00009888" value="0x1B140C00" />
+        <register type="NOA" address="0x00009888" value="0x61112000" />
+        <register type="NOA" address="0x00009888" value="0x5F110945" />
+        <register type="NOA" address="0x00009888" value="0x03124000" />
+        <register type="NOA" address="0x00009888" value="0x05128000" />
+        <register type="NOA" address="0x00009888" value="0x09128000" />
+        <register type="NOA" address="0x00009888" value="0x0B128000" />
+        <register type="NOA" address="0x00009888" value="0x13138000" />
+        <register type="NOA" address="0x00009888" value="0x1B0D0040" />
+        <register type="NOA" address="0x00009888" value="0x1F0B00D3" />
+        <register type="NOA" address="0x00009888" value="0x190B0000" />
+        <register type="NOA" address="0x00009888" value="0x170B0000" />
+        <register type="NOA" address="0x00009888" value="0x1B170002" />
+        <register type="NOA" address="0x00009888" value="0x0D174000" />
+        <register type="NOA" address="0x00009888" value="0x071800A3" />
+        <register type="NOA" address="0x00009888" value="0x11180000" />
+        <register type="NOA" address="0x00009888" value="0x032D4000" />
+        <register type="NOA" address="0x00009888" value="0x032B00D3" />
+        <register type="NOA" address="0x00009888" value="0x192B0000" />
+        <register type="NOA" address="0x00009888" value="0x092B0000" />
+        <register type="NOA" address="0x00009888" value="0x55103000" />
+        <register type="NOA" address="0x00009888" value="0x57100000" />
+        <register type="NOA" address="0x00009888" value="0x47101000" />
+        <register type="NOA" address="0x00009888" value="0x49107003" />
+        <register type="NOA" address="0x00009888" value="0x4B100402" />
+        <register type="NOA" address="0x00009888" value="0x4D100230" />
+        <register type="NOA" address="0x00009888" value="0x31100000" />
+        <register type="NOA" address="0x00009884" value="0x00000003" />
+        <register type="NOA" address="0x00009888" value="0x65100002" />
+        <register type="NOA" address="0x00009884" value="0x00000000" />
+        <register type="NOA" address="0x00009888" value="0x42000001" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x0000D920" value="0x00000000" />
+        <register type="OA" address="0x0000D900" value="0x00000000" />
+        <register type="OA" address="0x0000D904" value="0x30800000" />
+        <register type="OA" address="0x0000D910" value="0x00000000" />
+        <register type="OA" address="0x0000D914" value="0x00800000" />
+        <register type="OA" address="0x0000DC40" value="0x00030000" />
+        <register type="OA" address="0x0000D940" value="0x00024002" />
+        <register type="OA" address="0x0000D944" value="0x0000B7FF" />
+        <register type="OA" address="0x0000DC00" value="0x00024002" />
+        <register type="OA" address="0x0000DC04" value="0x0000B7FF" />
+        <register type="OA" address="0x0000D948" value="0x0007F000" />
+        <register type="OA" address="0x0000D94C" value="0x000001FF" />
+        <register type="OA" address="0x0000DC08" value="0x0007F000" />
+        <register type="OA" address="0x0000DC0C" value="0x000001FF" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00008003" />
+    </register_config>
+  </set>
+
+  <set name="Metric set TestOa"
+       mdapi_supported_apis="VK OGL OCL IO"
+       underscore_name="test_oa"
+       hw_config_guid="30801299-fe7b-40ba-8a6c-64c6196f3748"
+       chipset="TGL"
+       symbol_name="TestOa"
+       >
+    <counter name="TestCounter7"
+             description="HW test counter 7. Factor: 0.6666"
+             data_type="uint64"
+             equation="B 7 READ"
+             underscore_name="counter7"
+             units="events"
+             symbol_name="Counter7"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="TestCounter8"
+             description="HW test counter 8. Should be equal to 1 in IOStream or in OAG query mode"
+             data_type="uint64"
+             equation="C 0 READ"
+             underscore_name="counter8"
+             units="events"
+             symbol_name="Counter8"
+             semantic_type="event"
+             mdapi_supported_apis="IO"
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="TestCounter9 - OAR enable"
+             description="HW test counter 9. Should be equal to 1 in query."
+             data_type="uint64"
+             equation="C 1 READ"
+             underscore_name="counter9"
+             units="events"
+             symbol_name="Counter9"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL MEDIA VK"
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="TestCounter4"
+             description="HW test counter 4. Factor: 0.3333"
+             data_type="uint64"
+             equation="B 4 READ"
+             underscore_name="counter4"
+             units="events"
+             symbol_name="Counter4"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="TestCounter5"
+             description="HW test counter 5. Factor: 0.3333"
+             data_type="uint64"
+             equation="B 5 READ"
+             underscore_name="counter5"
+             units="events"
+             symbol_name="Counter5"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="TestCounter6"
+             description="HW test counter 6. Factor: 0.16666"
+             data_type="uint64"
+             equation="B 6 READ"
+             underscore_name="counter6"
+             units="events"
+             symbol_name="Counter6"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="TestCounter3"
+             description="HW test counter 3. Factor: 0.5"
+             data_type="uint64"
+             equation="B 3 READ"
+             underscore_name="counter3"
+             units="events"
+             symbol_name="Counter3"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="TestCounter0"
+             description="HW test counter 0. Factor: 0.0"
+             data_type="uint64"
+             equation="B 0 READ"
+             underscore_name="counter0"
+             units="events"
+             symbol_name="Counter0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="TestCounter1"
+             description="HW test counter 1. Factor: 1.0"
+             data_type="uint64"
+             equation="B 1 READ"
+             underscore_name="counter1"
+             units="events"
+             symbol_name="Counter1"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="TestCounter2"
+             description="HW test counter 2. Factor: 1.0"
+             data_type="uint64"
+             equation="B 2 READ"
+             underscore_name="counter2"
+             units="events"
+             symbol_name="Counter2"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00000D04" value="0x00000200" />
+        <register type="NOA" address="0x00009840" value="0x00000000" />
+        <register type="NOA" address="0x00009884" value="0x00000000" />
+        <register type="NOA" address="0x00009888" value="0x280E0000" />
+        <register type="NOA" address="0x00009888" value="0x1E0E0147" />
+        <register type="NOA" address="0x00009888" value="0x180E0000" />
+        <register type="NOA" address="0x00009888" value="0x160E0000" />
+        <register type="NOA" address="0x00009888" value="0x1E0F1000" />
+        <register type="NOA" address="0x00009888" value="0x1E104000" />
+        <register type="NOA" address="0x00009888" value="0x2E020100" />
+        <register type="NOA" address="0x00009888" value="0x2C030004" />
+        <register type="NOA" address="0x00009888" value="0x38003000" />
+        <register type="NOA" address="0x00009888" value="0x1E0A8000" />
+        <register type="NOA" address="0x00009884" value="0x00000003" />
+        <register type="NOA" address="0x00009888" value="0x49110000" />
+        <register type="NOA" address="0x00009888" value="0x5D101400" />
+        <register type="NOA" address="0x00009888" value="0x1D140020" />
+        <register type="NOA" address="0x00009888" value="0x1D1103A3" />
+        <register type="NOA" address="0x00009888" value="0x01110000" />
+        <register type="NOA" address="0x00009888" value="0x61111000" />
+        <register type="NOA" address="0x00009888" value="0x1F128000" />
+        <register type="NOA" address="0x00009888" value="0x17100000" />
+        <register type="NOA" address="0x00009888" value="0x55100630" />
+        <register type="NOA" address="0x00009888" value="0x57100000" />
+        <register type="NOA" address="0x00009888" value="0x31100000" />
+        <register type="NOA" address="0x00009884" value="0x00000003" />
+        <register type="NOA" address="0x00009888" value="0x65100002" />
+        <register type="NOA" address="0x00009884" value="0x00000000" />
+        <register type="NOA" address="0x00009888" value="0x42000001" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x0000D920" value="0x00000000" />
+        <register type="OA" address="0x0000D900" value="0x00000000" />
+        <register type="OA" address="0x0000D904" value="0xF0800000" />
+        <register type="OA" address="0x0000D910" value="0x00000000" />
+        <register type="OA" address="0x0000D914" value="0xF0800000" />
+        <register type="OA" address="0x0000DC40" value="0x00FF0000" />
+        <register type="OA" address="0x0000D940" value="0x00000004" />
+        <register type="OA" address="0x0000D944" value="0x0000FFFF" />
+        <register type="OA" address="0x0000DC00" value="0x00000004" />
+        <register type="OA" address="0x0000DC04" value="0x0000FFFF" />
+        <register type="OA" address="0x0000D948" value="0x00000003" />
+        <register type="OA" address="0x0000D94C" value="0x0000FFFF" />
+        <register type="OA" address="0x0000DC08" value="0x00000003" />
+        <register type="OA" address="0x0000DC0C" value="0x0000FFFF" />
+        <register type="OA" address="0x0000D950" value="0x00000007" />
+        <register type="OA" address="0x0000D954" value="0x0000FFFF" />
+        <register type="OA" address="0x0000DC10" value="0x00000007" />
+        <register type="OA" address="0x0000DC14" value="0x0000FFFF" />
+        <register type="OA" address="0x0000D958" value="0x00100002" />
+        <register type="OA" address="0x0000D95C" value="0x0000FFF7" />
+        <register type="OA" address="0x0000DC18" value="0x00100002" />
+        <register type="OA" address="0x0000DC1C" value="0x0000FFF7" />
+        <register type="OA" address="0x0000D960" value="0x00100002" />
+        <register type="OA" address="0x0000D964" value="0x0000FFCF" />
+        <register type="OA" address="0x0000DC20" value="0x00100002" />
+        <register type="OA" address="0x0000DC24" value="0x0000FFCF" />
+        <register type="OA" address="0x0000D968" value="0x00100082" />
+        <register type="OA" address="0x0000D96C" value="0x0000FFEF" />
+        <register type="OA" address="0x0000DC28" value="0x00100082" />
+        <register type="OA" address="0x0000DC2C" value="0x0000FFEF" />
+        <register type="OA" address="0x0000D970" value="0x001000C2" />
+        <register type="OA" address="0x0000D974" value="0x0000FFE7" />
+        <register type="OA" address="0x0000DC30" value="0x001000C2" />
+        <register type="OA" address="0x0000DC34" value="0x0000FFE7" />
+        <register type="OA" address="0x0000D978" value="0x00100001" />
+        <register type="OA" address="0x0000D97C" value="0x0000FFE7" />
+        <register type="OA" address="0x0000DC38" value="0x00100001" />
+        <register type="OA" address="0x0000DC3C" value="0x0000FFE7" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E65C" value="0xFFFFFFFF" />
+    </register_config>
+  </set>
+
+</metrics>
diff --git a/lib/i915/perf-configs/oa_guid_registry.py b/lib/i915/perf-configs/oa_guid_registry.py
new file mode 100644
index 00000000..0ed3983f
--- /dev/null
+++ b/lib/i915/perf-configs/oa_guid_registry.py
@@ -0,0 +1,73 @@
+
+import copy
+import hashlib
+
+import xml.etree.ElementTree as et
+
+
+class Registry:
+    """Helpers computing the hashes that identify HW register configurations."""
+
+    # Hashing a normalized CSV rendering of the registers avoids depending on
+    # the exact serialization produced by et.tostring().
+    @staticmethod
+    def hw_config_hash(metric_set):
+        """Return the MD5 hex digest of a metric set's HW register configs.
+
+        Args:
+            metric_set -- an ElementTree element for a 'set'
+
+        Every 'register' found directly under each 'register_config'
+        contributes one "id,priority,availability,address,value" line, with
+        address and value parsed as hexadecimal and written in decimal. A
+        missing 'id' or 'priority' attribute counts as '0' and a missing
+        'availability' attribute as the empty string.
+
+        Note this doesn't accept an MDAPI based metric set description.
+        """
+
+        rows = []
+        for reg_config in metric_set.findall(".//register_config"):
+            prefix = ','.join([reg_config.get('id', '0'),
+                               reg_config.get('priority', '0'),
+                               reg_config.get('availability', "")])
+            for register in reg_config.findall("register"):
+                address = int(register.get('address'), 16)
+                content = int(register.get('value'), 16)
+                rows.append("%s,%d,%d\n" % (prefix, address, content))
+
+        return hashlib.md5(''.join(rows).encode('utf-8')).hexdigest()
+
+
+    @staticmethod
+    def mdapi_hw_config_hash(mdapi_metric_set):
+        """Return the MD5 hex digest of an MDAPI metric set's register config.
+
+        Args:
+            mdapi_metric_set -- an ElementTree element for a 'MetricSet'
+
+        Note: this is a simplistic hash over the serialized contents of all
+        RegConfigStart elements, so it changes even for minor edits in VPG's
+        MDAPI XML files. Without any promises of stability within these
+        files it can't hurt to err on the side of caution here, so we know
+        when to investigate changes that might affect our usages.
+        """
+
+        wrapper = et.Element('config')
+        for reg_block in mdapi_metric_set.findall(".//RegConfigStart"):
+            # Copy so that the caller's tree is left untouched.
+            wrapper.append(copy.deepcopy(reg_block))
+
+        return hashlib.md5(et.tostring(wrapper)).hexdigest()
+
+
+    @staticmethod
+    def chipset_derive_hash(chipset, hash):
+        """Derive a HW config hash for a given chipset.
+
+        The result is "<chipset>-<hash>", which helps avoid collisions
+        between identical configs across different Gen or GT.
+        """
+
+        return "{0}-{1}".format(chipset, hash)
diff --git a/lib/i915/perf-configs/perf-codegen.py b/lib/i915/perf-configs/perf-codegen.py
new file mode 100755
index 00000000..c48343b3
--- /dev/null
+++ b/lib/i915/perf-configs/perf-codegen.py
@@ -0,0 +1,850 @@
+#!/usr/bin/env python2
+#
+# Copyright (c) 2015-2018 Intel Corporation
+#
+# Permission is hereby granted, free of charge, to any person obtaining a
+# copy of this software and associated documentation files (the "Software"),
+# to deal in the Software without restriction, including without limitation
+# the rights to use, copy, modify, merge, publish, distribute, sublicense,
+# and/or sell copies of the Software, and to permit persons to whom the
+# Software is furnished to do so, subject to the following conditions:
+#
+# The above copyright notice and this permission notice (including the next
+# paragraph) shall be included in all copies or substantial portions of the
+# Software.
+#
+# THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
+# IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
+# FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
+# THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
+# LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
+# FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS
+# IN THE SOFTWARE.
+
+import argparse
+import os
+import sys
+import textwrap
+
+import xml.etree.cElementTree as et
+
+import codegen
+
+# Output sinks, both unset at import time. `c` is invoked by the emit_*
+# helpers below with one line of generated C per call.
+# NOTE(review): `h` is presumably the matching header writer -- confirm where
+# both get assigned.
+h = None
+c = None
+
+# NOTE(review): neither name is used in the visible part of this script;
+# presumably a cache of generated functions and an optional MathML output
+# target -- confirm against their users.
+hashed_funcs = {}
+xml_equations = None
+
+def check_operand_type(set, arg):
+    """Wrap an equation operand in the MathML element matching its kind.
+
+    Decimal literals become <mn>; '$' variables become <mi>, nested in a
+    tooltip <maction> when a description is available from the set's
+    counter_vars or from hw_vars; anything else is returned untouched.
+    """
+    if arg.isdigit():
+        return "\n<mn>" + arg + "</mn>"
+
+    if arg[0] != "$":
+        return arg
+
+    tooltip = None
+    if arg in set.counter_vars:
+        tooltip = set.counter_vars[arg].get('description')
+    elif arg in hw_vars and 'desc' in hw_vars[arg]:
+        tooltip = hw_vars[arg]['desc']
+
+    if tooltip is None:
+        return "<mi>" + arg + "</mi>"
+
+    return "\n<maction actiontype='tooltip'>\n<mi>" + arg + "</mi>\n<mtext>" + tooltip + "</mtext>\n</maction>"
+
+# Precedence ranks for the MathML splicers: a splicer brackets an operand
+# whose rank is lower than the rank it compares against, and returns its own
+# rank alongside the markup it produced.
+# http://en.cppreference.com/w/c/language/operator_precedence
+# NOTE(review): mul/shift/and appear to reuse the level numbers of that table
+# while add/sub (2) do not -- confirm the intended ordering.
+and_precedence = 8
+shft_precedence = 5
+mul_precedence = 3
+add_precedence = 2
+sub_precedence = 2
+default_precedence = 16 # a high value which denotes no brackets needed
+
+def put_brackets(arg):
+    """Surround a MathML fragment with literal '(' and ')' <mtext> elements."""
+    opening = "\n<mtext>(</mtext>"
+    closing = "\n<mtext>)</mtext>"
+    return "".join([opening, arg, closing])
+
+def mathml_splice_add(set, args):
+    """Render an addition as MathML.
+
+    args holds two [markup, precedence] pairs; args[1] is rendered on the
+    left of the operator and args[0] on the right. Returns a
+    [markup, add_precedence] pair.
+    """
+    right_entry, left_entry = args[0], args[1]
+    right = check_operand_type(set, right_entry[0])
+    left = check_operand_type(set, left_entry[0])
+    # Operands ranked below addition are bracketed instead.
+    if right_entry[1] < add_precedence:
+        right = put_brackets(right_entry[0])
+    if left_entry[1] < add_precedence:
+        left = put_brackets(left_entry[0])
+    markup = left + "\n<mo>+</mo>" + right
+    return [markup, add_precedence]
+
+def mathml_splice_div(set, args):
+    """Render a division as a MathML fraction.
+
+    args[1] becomes the numerator and args[0] the denominator; no brackets
+    are ever added. Returns a [markup, default_precedence] pair.
+    """
+    denominator = check_operand_type(set, args[0][0])
+    numerator = check_operand_type(set, args[1][0])
+    markup = "\n<mfrac>\n<mrow>" + numerator + "\n</mrow>\n<mrow>" + denominator + "</mrow>\n</mfrac>"
+    return [markup, default_precedence]
+
+def mathml_splice_max(set, args):
+    """Render max(args[1], args[0]) as MathML text.
+
+    Returns a [markup, default_precedence] pair.
+    """
+    second = check_operand_type(set, args[0][0])
+    first = check_operand_type(set, args[1][0])
+    markup = "\n<mtext>max ( </mtext>" + first + "\n<mtext> , </mtext>" + second + "\n<mtext> ) </mtext>"
+    return [markup, default_precedence]
+
+def mathml_splice_mul(set, args):
+    """Render a multiplication as MathML.
+
+    args holds two [markup, precedence] pairs; args[1] is rendered on the
+    left of the operator and args[0] on the right. Returns a
+    [markup, mul_precedence] pair.
+    """
+    right_entry, left_entry = args[0], args[1]
+    right = check_operand_type(set, right_entry[0])
+    left = check_operand_type(set, left_entry[0])
+    # Operands ranked below multiplication are bracketed instead.
+    if right_entry[1] < mul_precedence:
+        right = put_brackets(right_entry[0])
+    if left_entry[1] < mul_precedence:
+        left = put_brackets(left_entry[0])
+    markup = left + "\n<mo>*</mo>" + right
+    return [markup, mul_precedence]
+
+def mathml_splice_sub(set, args):
+    """Render a subtraction as MathML.
+
+    args holds two [markup, precedence] pairs; args[1] is rendered on the
+    left of the operator and args[0] on the right. Returns a
+    [markup, sub_precedence] pair.
+    """
+    right_entry, left_entry = args[0], args[1]
+    right = check_operand_type(set, right_entry[0])
+    left = check_operand_type(set, left_entry[0])
+    # Operands ranked below subtraction are bracketed instead.
+    if right_entry[1] < sub_precedence:
+        right = put_brackets(right_entry[0])
+    if left_entry[1] < sub_precedence:
+        left = put_brackets(left_entry[0])
+    markup = left + "\n<mo>-</mo>" + right
+    return [markup, sub_precedence]
+
+def mathml_splice_read(set, args):
+    """Render a READ as a tooltip <maction> labelled args[1] followed by args[0].
+
+    The tooltip text is the fixed string "placeholder". Returns a
+    [markup, default_precedence] pair.
+    """
+    label = args[1][0] + args[0][0]
+    markup = "\n<maction actiontype='tooltip'>\n<mi>" + label + "</mi>\n<mtext>placeholder</mtext>\n</maction>"
+    return [markup, default_precedence]
+
+def mathml_splice_read_reg(set, args):
+    """Render a READ_REG as a tooltip <maction> labelled with args[0].
+
+    The tooltip text is the fixed string "placeholder". Returns a
+    [markup, default_precedence] pair.
+    """
+    label = args[0][0]
+    markup = "\n<maction actiontype='tooltip'>\n<mi>" + label + "</mi>\n<mtext>placeholder</mtext>\n</maction>"
+    return [markup, default_precedence]
+
+def mathml_splice_min(set, args):
+    """Render min(args[1], args[0]) as MathML text.
+
+    Returns a [markup, default_precedence] pair.
+    """
+    second = check_operand_type(set, args[0][0])
+    first = check_operand_type(set, args[1][0])
+    markup = "\n<mtext>min ( </mtext>" + first + "\n<mtext> , </mtext>" + second + "\n<mtext> ) </mtext>"
+    return [markup, default_precedence]
+
+def mathml_splice_lshft(set, args):
+    """Render a left shift as MathML.
+
+    args holds two [markup, precedence] pairs; args[1] is rendered on the
+    left of the operator and args[0] on the right. Returns a
+    [markup, shft_precedence] pair.
+    """
+    operand_0 = check_operand_type(set, args[0][0])
+    operand_1 = check_operand_type(set, args[1][0])
+    # Operands ranked below a shift are bracketed instead.
+    if args[0][1] < shft_precedence:
+        operand_0 = put_brackets(args[0][0])
+    if args[1][1] < shft_precedence:
+        operand_1 = put_brackets(args[1][0])
+    # '<' must be written as an entity: a raw '<<' inside <mo> is not
+    # well-formed markup.
+    return [operand_1 + "\n<mo>&lt;&lt;</mo>" + operand_0, shft_precedence]
+
+def mathml_splice_rshft(set, args):
+    """Render a right shift as MathML.
+
+    args holds two [markup, precedence] pairs; args[1] is rendered on the
+    left of the operator and args[0] on the right. Returns a
+    [markup, shft_precedence] pair, matching mathml_splice_lshft.
+    """
+    operand_0 = check_operand_type(set, args[0][0])
+    operand_1 = check_operand_type(set, args[1][0])
+    # Use the shift rank (not the multiplication one) both for bracketing
+    # the operands and for the rank reported to the enclosing expression.
+    if args[0][1] < shft_precedence:
+        operand_0 = put_brackets(args[0][0])
+    if args[1][1] < shft_precedence:
+        operand_1 = put_brackets(args[1][0])
+    return [operand_1 + "\n<mo>>></mo>" + operand_0, shft_precedence]
+
+def mathml_splice_and(set, args):
+    """Render a bitwise AND as MathML.
+
+    args holds two [markup, precedence] pairs; args[1] is rendered on the
+    left of the operator and args[0] on the right. Returns a
+    [markup, and_precedence] pair.
+    """
+    operand_0 = check_operand_type(set, args[0][0])
+    operand_1 = check_operand_type(set, args[1][0])
+    # Operands ranked below AND are bracketed instead.
+    if args[0][1] < and_precedence:
+        operand_0 = put_brackets(args[0][0])
+    if args[1][1] < and_precedence:
+        operand_1 = put_brackets(args[1][0])
+    # '&' must be written as an entity: a bare '&' inside <mo> is not
+    # well-formed markup.
+    return [operand_1 + "\n<mo>&amp;</mo>" + operand_0, and_precedence]
+
+def emit_fadd(tmp_id, args):
+    """Emit a C 'double' temporary holding args[1] + args[0].
+
+    Returns the next free temporary id.
+    """
+    lhs, rhs = args[1], args[0]
+    c("double tmp{0} = {1} + {2};".format(tmp_id, lhs, rhs))
+    next_id = tmp_id + 1
+    return next_id
+
+# The generated code checks for a zero divisor and yields 0 in that case.
+def emit_fdiv(tmp_id, args):
+    """Emit a guarded C 'double' division of args[1] by args[0].
+
+    Three temporaries are emitted (dividend, divisor, quotient); returns the
+    next free temporary id.
+    """
+    dividend_id = tmp_id
+    divisor_id = tmp_id + 1
+    quotient_id = tmp_id + 2
+    c("double tmp{0} = {1};".format(dividend_id, args[1]))
+    c("double tmp{0} = {1};".format(divisor_id, args[0]))
+    c("double tmp{0} = tmp{1} ? tmp{2} / tmp{1} : 0;".format(quotient_id, divisor_id, dividend_id))
+    return quotient_id + 1
+
+def emit_fmax(tmp_id, args):
+    """Emit a C 'double' temporary holding MAX(args[1], args[0]).
+
+    Both operands are first stored in temporaries of their own; returns the
+    next free temporary id.
+    """
+    first_id = tmp_id
+    second_id = tmp_id + 1
+    result_id = tmp_id + 2
+    c("double tmp{0} = {1};".format(first_id, args[1]))
+    c("double tmp{0} = {1};".format(second_id, args[0]))
+    c("double tmp{0} = MAX(tmp{1}, tmp{2});".format(result_id, first_id, second_id))
+    return result_id + 1
+
+def emit_fmul(tmp_id, args):
+    """Emit a C 'double' temporary holding args[1] * args[0].
+
+    Returns the next free temporary id.
+    """
+    lhs, rhs = args[1], args[0]
+    c("double tmp{0} = {1} * {2};".format(tmp_id, lhs, rhs))
+    next_id = tmp_id + 1
+    return next_id
+
+def emit_fsub(tmp_id, args):
+    """Emit a C 'double' temporary holding args[1] - args[0].
+
+    Returns the next free temporary id.
+    """
+    lhs, rhs = args[1], args[0]
+    c("double tmp{0} = {1} - {2};".format(tmp_id, lhs, rhs))
+    next_id = tmp_id + 1
+    return next_id
+
+def emit_read(tmp_id, args):
+    """Emit a C 'uint64_t' temporary loaded from the accumulator.
+
+    args[1] is lower-cased to select the metric set's '<name>_offset' field
+    and args[0] is the index added to it. Returns the next free temporary id.
+    """
+    section = args[1].lower()
+    index = args[0]
+    c("uint64_t tmp{0} = accumulator[metric_set->{1}_offset + {2}];".format(tmp_id, section, index))
+    next_id = tmp_id + 1
+    return next_id
+
+# Register reads are stubbed out: the generated code does not capture
+# registers. They would only be useful for query mode, where the driver
+# captures additional registers.
+def emit_read_reg(tmp_id, args):
+    """Emit a C 'uint64_t' temporary fixed to 0; args is ignored.
+
+    Returns the next free temporary id.
+    """
+    c("uint64_t tmp{0} = 0;".format(tmp_id))
+    next_id = tmp_id + 1
+    return next_id
+
+def emit_uadd(tmp_id, args):
+    """Emit a C 'uint64_t' temporary holding args[1] + args[0].
+
+    Returns the next free temporary id.
+    """
+    lhs, rhs = args[1], args[0]
+    c("uint64_t tmp{0} = {1} + {2};".format(tmp_id, lhs, rhs))
+    next_id = tmp_id + 1
+    return next_id
+
+# The generated code checks for a zero divisor and yields 0 in that case.
+def emit_udiv(tmp_id, args):
+    """Emit a guarded C 'uint64_t' division of args[1] by args[0].
+
+    Three temporaries are emitted (dividend, divisor, quotient); returns the
+    next free temporary id.
+    """
+    dividend_id = tmp_id
+    divisor_id = tmp_id + 1
+    quotient_id = tmp_id + 2
+    c("uint64_t tmp{0} = {1};".format(dividend_id, args[1]))
+    c("uint64_t tmp{0} = {1};".format(divisor_id, args[0]))
+    c("uint64_t tmp{0} = tmp{1} ? tmp{2} / tmp{1} : 0;".format(quotient_id, divisor_id, dividend_id))
+    return quotient_id + 1
+
+def emit_umul(tmp_id, args):
+    """Emit a C 'uint64_t' temporary holding args[1] * args[0].
+
+    Returns the next free temporary id.
+    """
+    lhs, rhs = args[1], args[0]
+    c("uint64_t tmp{0} = {1} * {2};".format(tmp_id, lhs, rhs))
+    next_id = tmp_id + 1
+    return next_id
+
+def emit_usub(tmp_id, args):
+    """Emit a C 'uint64_t' temporary holding args[1] - args[0].
+
+    Returns the next free temporary id.
+    """
+    lhs, rhs = args[1], args[0]
+    c("uint64_t tmp{0} = {1} - {2};".format(tmp_id, lhs, rhs))
+    next_id = tmp_id + 1
+    return next_id
+
+def emit_umin(tmp_id, args):
+    """Emit a C 'uint64_t' temporary holding MIN(args[1], args[0]).
+
+    Returns the next free temporary id.
+    """
+    first, second = args[1], args[0]
+    c("uint64_t tmp{0} = MIN({1}, {2});".format(tmp_id, first, second))
+    next_id = tmp_id + 1
+    return next_id
+
+def emit_lshft(tmp_id, args):
+    """Emit a C 'uint64_t' temporary holding args[1] << args[0].
+
+    Returns the next free temporary id.
+    """
+    shifted, amount = args[1], args[0]
+    c("uint64_t tmp{0} = {1} << {2};".format(tmp_id, shifted, amount))
+    next_id = tmp_id + 1
+    return next_id
+
+def emit_rshft(tmp_id, args):
+    """Emit a C 'uint64_t' temporary holding args[1] >> args[0].
+
+    Returns the next free temporary id.
+    """
+    shifted, amount = args[1], args[0]
+    c("uint64_t tmp{0} = {1} >> {2};".format(tmp_id, shifted, amount))
+    next_id = tmp_id + 1
+    return next_id
+
+def emit_and(tmp_id, args):
+    """Emit a C 'uint64_t' temporary holding args[1] & args[0].
+
+    Returns the next free temporary id.
+    """
+    lhs, rhs = args[1], args[0]
+    c("uint64_t tmp{0} = {1} & {2};".format(tmp_id, lhs, rhs))
+    next_id = tmp_id + 1
+    return next_id
+
+# RPN operator table: token -> (operand count, C emitter, MathML splicer)
+ops = {
+    "FADD":     (2, emit_fadd, mathml_splice_add),
+    "FDIV":     (2, emit_fdiv, mathml_splice_div),
+    "FMAX":     (2, emit_fmax, mathml_splice_max),
+    "FMUL":     (2, emit_fmul, mathml_splice_mul),
+    "FSUB":     (2, emit_fsub, mathml_splice_sub),
+    "READ":     (2, emit_read, mathml_splice_read),
+    "READ_REG": (1, emit_read_reg, mathml_splice_read_reg),
+    "UADD":     (2, emit_uadd, mathml_splice_add),
+    "UDIV":     (2, emit_udiv, mathml_splice_div),
+    "UMUL":     (2, emit_umul, mathml_splice_mul),
+    "USUB":     (2, emit_usub, mathml_splice_sub),
+    "UMIN":     (2, emit_umin, mathml_splice_min),
+    "<<":       (2, emit_lshft, mathml_splice_lshft),
+    ">>":       (2, emit_rshft, mathml_splice_rshft),
+    "AND":      (2, emit_and, mathml_splice_and),
+}
+
+def brkt(subexp):
+    """Parenthesize subexp when it contains a space, else return it as is."""
+    needs_parens = " " in subexp
+    return "(" + subexp + ")" if needs_parens else subexp
+
+def splice_bitwise_and(args):
+    """Return the text 'args[1] & args[0]', bracketing operands via brkt()."""
+    lhs = brkt(args[1])
+    rhs = brkt(args[0])
+    return lhs + " & " + rhs
+
+def splice_logical_and(args):
+    """Return the text 'args[1] && args[0]', bracketing operands via brkt()."""
+    lhs = brkt(args[1])
+    rhs = brkt(args[0])
+    return lhs + " && " + rhs
+
+def splice_ult(args):
+    """Return the text 'args[1] < args[0]', bracketing operands via brkt()."""
+    lhs = brkt(args[1])
+    rhs = brkt(args[0])
+    return lhs + " < " + rhs
+
+def splice_ugte(args):
+    """Return the text 'args[1] >= args[0]', bracketing operands via brkt()."""
+    lhs = brkt(args[1])
+    rhs = brkt(args[0])
+    return lhs + " >= " + rhs
+
+# Expression operator table: token -> (operand count, splicer)
+exp_ops = {
+    "AND":  (2, splice_bitwise_and),
+    "UGTE": (2, splice_ugte),
+    "ULT":  (2, splice_ult),
+    "&&":   (2, splice_logical_and),
+}
+
+
+# Known '$' variables usable in equations. For each one, 'c' is the C
+# expression substituted for the variable in generated code and the optional
+# 'desc' is the tooltip text used by check_operand_type() in MathML output.
+# Note that $DualSubsliceMask and $SubsliceMask resolve to the same field.
+hw_vars = {
+        "$EuCoresTotalCount": { 'c': "perf->devinfo.n_eus", 'desc': "The total number of execution units" },
+        "$EuSlicesTotalCount": { 'c': "perf->devinfo.n_eu_slices" },
+        "$EuSubslicesTotalCount": { 'c': "perf->devinfo.n_eu_sub_slices" },
+        "$EuThreadsCount": { 'c': "perf->devinfo.eu_threads_count" },
+        "$SliceMask": { 'c': "perf->devinfo.slice_mask" },
+        "$DualSubsliceMask": { 'c': "perf->devinfo.subslice_mask" },
+        "$SubsliceMask": { 'c': "perf->devinfo.subslice_mask" },
+        "$GpuTimestampFrequency": { 'c': "perf->devinfo.timestamp_frequency" },
+        "$GpuMinFrequency": { 'c': "perf->devinfo.gt_min_freq" },
+        "$GpuMaxFrequency": { 'c': "perf->devinfo.gt_max_freq" },
+        "$SkuRevisionId": { 'c': "perf->devinfo.revision" },
+        "$QueryMode": { 'c': "perf->devinfo.query_mode" },
+}
+
+def splice_mathml_expression(set, equation, tag):
+    """Convert an RPN equation string into a '<mathml_TAG>' markup string.
+
+    Tokens are pushed on a stack as [markup, precedence] pairs; whenever the
+    top of the stack is an operator from `ops`, it is popped together with
+    its operands and replaced by the pair returned by its MathML splicer.
+    The markup left on top of the stack is wrapped as
+    "<mathml_TAG><mi>TAG</mi><mo> = </mo>...</mathml_TAG>".
+    """
+    pending = []
+    for token in equation.split():
+        # Only a token pushed onto an empty stack is typed here; the others
+        # are typed by the splicers consuming them.
+        if len(pending) == 0:
+            token = check_operand_type(set, token)
+        pending.append([token, default_precedence])
+        while pending and pending[-1][0] in ops:
+            operator = pending.pop()[0]
+            operand_count, _emit, render = ops[operator]
+            operands = [pending.pop() for _n in range(operand_count)]
+            pending.append(render(set, operands))
+    markup = pending.pop()[0]
+    heading = "<mi>" + tag + "</mi><mo> = </mo>"
+    return "<mathml_" + tag + ">" + heading + markup + "</mathml_" + tag + ">"
+
+def output_rpn_equation_code(set, counter, equation):
+    """Emit the C statements evaluating an RPN `equation` for `counter`.
+
+    The equation is split on whitespace and evaluated with a stack: each time
+    an operator from `ops` lands on top, its operands are popped, "$" variables
+    among them are resolved to C expressions, and the operator's emit callback
+    writes the C code and returns the next free temporary id. The result of the
+    operation ("tmpN") is pushed back. A final "return <value>;" is emitted.
+
+    Raises Exception when a "$" variable (including one left as the sole
+    result) cannot be resolved, when an operator lacks operands, or when the
+    stack does not end up holding exactly one value.
+    """
+    def where():
+        return set.name + " :: " + counter.get('name')
+
+    def resolve(operand):
+        # Only "$"-prefixed tokens are variables; constants and tmpN pass through.
+        if operand[0] != "$":
+            return operand
+        if operand in hw_vars:
+            return hw_vars[operand]['c']
+        if operand in set.counter_vars:
+            # Another counter of the same set: call its read function.
+            return set.read_funcs[operand[1:]] + "(perf, metric_set, accumulator)"
+        raise Exception("Failed to resolve variable " + operand + " in equation " + equation + " for " + where())
+
+    c("/* RPN equation: " + equation + " */")
+    stack = []
+    tmp_id = 0
+
+    for token in equation.split():
+        stack.append(token)
+        while stack and stack[-1] in ops:
+            op = stack.pop()
+            argc, callback, _ = ops[op]
+            if len(stack) < argc:
+                raise Exception("Not enough operands for \"" + op + "\" in equation \"" +
+                                equation + "\" for " + where())
+            args = [resolve(stack.pop()) for i in range(0, argc)]
+
+            # The callback emits the C for this operation and returns the next
+            # unused temporary id, so its result lives in tmp<id - 1>.
+            tmp_id = callback(tmp_id, args)
+            stack.append("tmp{0}".format(tmp_id - 1))
+
+    if len(stack) != 1:
+        raise Exception("Spurious empty rpn code for " + where() +
+                ".\nThis is probably due to some unhandled RPN function, in the equation \"" +
+                equation + "\"")
+
+    # The equation may consist of a single variable; resolve it like any other
+    # operand instead of leaking an unknown "$name" into the generated C.
+    c("\nreturn " + resolve(stack[-1]) + ";")
+
+def splice_rpn_expression(set, counter_name, expression):
+    """Turn an RPN availability `expression` into a single C expression string.
+
+    Operators are looked up in `exp_ops`; "$" operands must be hardware
+    variables from `hw_vars`. `counter_name` is only used in error messages.
+
+    Raises Exception for an unknown "$" operand or when the stack does not end
+    up holding exactly one value.
+    """
+    pending = []
+
+    for tok in expression.split():
+        pending.append(tok)
+        # Collapse the stack for as long as a known operator is on top.
+        while pending and pending[-1] in exp_ops:
+            n_operands, splicer = exp_ops[pending.pop()]
+            operands = []
+            for _ in range(0, n_operands):
+                value = pending.pop()
+                if value[0] == "$":
+                    if value not in hw_vars:
+                        raise Exception("Failed to resolve variable " + value + " in expression " + expression + " for " + set.name + " :: " + counter_name)
+                    value = hw_vars[value]['c']
+                operands.append(value)
+
+            pending.append(splicer(operands))
+
+    if len(pending) == 1:
+        return pending[-1]
+
+    raise Exception("Spurious empty rpn expression for " + set.name + " :: " +
+            counter_name + ".\nThis is probably due to some unhandled RPN operation, in the expression \"" +
+            expression + "\"")
+
+
+def data_type_to_ctype(ret_type):
+    """Map a counter data type name to the C type used by generated code.
+
+    "uint64" maps to "uint64_t" and "float" to "double"; anything else raises
+    Exception.
+    """
+    c_types = {"uint64": "uint64_t", "float": "double"}
+    if ret_type in c_types:
+        return c_types[ret_type]
+    raise Exception("Unhandled case for mapping \"" + ret_type + "\" to a C type")
+
+
+def output_counter_read(gen, set, counter):
+    """Emit the C read function of `counter`, or an alias to an identical one.
+
+    Functions are de-duplicated through `hashed_funcs`, keyed by the counter's
+    read_hash: the first counter seen with a given hash gets a real function,
+    later ones get a "#define" pointing at it.
+    """
+    c("\n")
+    c("/* {0} :: {1} */".format(set.name, counter.get('name')))
+
+    sym = counter.read_sym
+    key = counter.read_hash
+
+    if key in hashed_funcs:
+        # An equivalent function was already emitted: alias it.
+        c("#define %s \\" % sym)
+        c.indent(4)
+        c("%s" % hashed_funcs[key])
+        c.outdent(4)
+        return
+
+    ret_ctype = data_type_to_ctype(counter.get('data_type'))
+    read_eq = counter.get('equation')
+    # Continuation lines of the prototype line up after "name(".
+    param_indent = len(sym) + 1
+
+    c("static " + ret_ctype)
+    c(sym + "(const struct intel_perf *perf,\n")
+    c.indent(param_indent)
+    c("const struct intel_perf_metric_set *metric_set,\n")
+    c("uint64_t *accumulator)\n")
+    c.outdent(param_indent)
+
+    c("{")
+    c.indent(4)
+
+    output_rpn_equation_code(set, counter, read_eq)
+
+    c.outdent(4)
+    c("}")
+
+    hashed_funcs[key] = sym
+
+
+def output_counter_max(gen, set, counter):
+    """Emit the C max-value function of `counter`, or an alias to an identical one.
+
+    Nothing is emitted when the counter has no max equation or when it is the
+    literal "100". Functions are de-duplicated through `hashed_funcs`, keyed by
+    the counter's max_hash.
+    """
+    max_eq = counter.get('max_equation')
+    if (not max_eq) or max_eq == "100":
+        return
+
+    c("\n")
+    c("/* {0} :: {1} */".format(set.name, counter.get('name')))
+
+    sym = counter.max_sym
+    key = counter.max_hash
+
+    if key in hashed_funcs:
+        # An equivalent function was already emitted: alias it.
+        c("#define %s \\" % sym)
+        c.indent(4)
+        c("%s" % hashed_funcs[key])
+        c.outdent(4)
+        return
+
+    ret_ctype = data_type_to_ctype(counter.get('data_type'))
+    # Continuation lines of the prototype line up after "name(".
+    param_indent = len(sym) + 1
+
+    c("static " + ret_ctype)
+
+    c(sym + "(const struct intel_perf *perf,\n")
+    c.indent(param_indent)
+    c("const struct intel_perf_metric_set *metric_set,\n")
+    c("uint64_t *accumulator)\n")
+    c.outdent(param_indent)
+
+    c("{")
+    c.indent(4)
+
+    output_rpn_equation_code(set, counter, max_eq)
+
+    c.outdent(4)
+    c("}")
+
+    hashed_funcs[key] = sym
+
+
+# Renames applied to a counter's 'semantic_type' attribute before it is
+# upper-cased into an INTEL_PERF_LOGICAL_COUNTER_TYPE_* name; types not listed
+# here are used unchanged (see output_counter_report).
+semantic_type_map = {
+    "duration": "raw",
+    "ratio": "event"
+    }
+
+def output_availability(set, availability, counter_name):
+    """Emit the opening "if (...) {" guarding an optionally available item.
+
+    The RPN `availability` expression is spliced into C and split on " && " so
+    that each clause goes on its own line. The caller emits the guarded body
+    and the closing brace.
+    """
+    clauses = splice_rpn_expression(set, counter_name, availability).split(' && ')
+
+    if len(clauses) == 1:
+        c("if (" + clauses[0] + ") {")
+        return
+
+    c("if (" + clauses[0] + " &&")
+    c.indent(4)
+    for clause in clauses[1:-1]:
+        c(clause + " &&")
+    c(clauses[-1] + ") {")
+    c.outdent(4)
+
+
+def output_units(unit):
+    """Return `unit` upper-cased with every space replaced by an underscore."""
+    return "_".join(unit.split(' ')).upper()
+
+
+def output_counter_report(set, counter):
+    """Emit the C statements registering `counter` in its metric set.
+
+    The generated code takes the next slot of metric_set->counters, fills in
+    its fields and adds it to the counter's 'mdapi_group'. When the counter has
+    an 'availability' attribute the whole registration is wrapped in the
+    corresponding "if (...) { }".
+    """
+    data_type = counter.get('data_type')
+    storage_uc = data_type.upper()
+
+    semantic_type = counter.get('semantic_type')
+    # Some semantic types are reported under a different name.
+    semantic_type = semantic_type_map.get(semantic_type, semantic_type)
+    type_uc = semantic_type.upper()
+
+    symbol = counter.get('symbol_name')
+
+    c("\n")
+
+    availability = counter.get('availability')
+    guarded = bool(availability)
+    if guarded:
+        output_availability(set, availability, counter.get('name'))
+        c.indent(4)
+
+    c("counter = &metric_set->counters[metric_set->n_counters++];\n")
+    c("counter->metric_set = metric_set;\n")
+    c("counter->name = \"{0}\";\n".format(counter.get('name')))
+    c("counter->symbol_name = \"{0}\";\n".format(symbol))
+    c("counter->desc = \"{0}\";\n".format(counter.get('description')))
+    c("counter->type = INTEL_PERF_LOGICAL_COUNTER_TYPE_{0};\n".format(type_uc))
+    c("counter->storage = INTEL_PERF_LOGICAL_COUNTER_STORAGE_{0};\n".format(storage_uc))
+    c("counter->unit = INTEL_PERF_LOGICAL_COUNTER_UNIT_{0};\n".format(output_units(counter.get('units'))))
+    c("counter->read_{0} = {1};\n".format(data_type, set.read_funcs[symbol]))
+    c("counter->max_{0} = {1};\n".format(data_type, set.max_funcs[symbol]))
+    c("intel_perf_add_logical_counter(perf, counter, \"{0}\");\n".format(counter.get('mdapi_group')))
+
+    if guarded:
+        c.outdent(4)
+        c("}\n")
+
+
+def generate_register_configs(set):
+    """Emit the C code allocating and filling a metric set's register arrays.
+
+    Each <register_config> element contributes its <register> children to the
+    array selected by its 'type' attribute. Arrays are sized for the sum of all
+    configs of that type; a config carrying an 'availability' attribute has its
+    assignments wrapped in the corresponding "if (...) { }".
+    """
+    field_for_type = {
+        'FLEX': 'flex_regs',
+        'NOA': 'mux_regs',
+        'OA': 'b_counter_regs',
+    }
+    configs = set.findall('register_config')
+
+    # allocate memory: one array per register kind, large enough for every
+    # config of that kind
+    n_regs_per_field = {}
+    for config in configs:
+        field = field_for_type[config.get('type')]
+        n_regs_per_field[field] = n_regs_per_field.get(field, 0) + len(config.findall('register'))
+
+    for field, n_regs in n_regs_per_field.items():
+        c("metric_set->{0} = calloc({1}, sizeof(struct intel_perf_register_prog));".format(field, n_regs))
+    c("\n")
+
+    # fill in register/values
+    for config in configs:
+        field = field_for_type[config.get('type')]
+
+        guard = config.get('availability')
+        if guard:
+            output_availability(set, guard, config.get('type') + ' register config')
+            c.indent(4)
+
+        for reg in config.findall('register'):
+            c("metric_set->%s[metric_set->n_%s++] = (struct intel_perf_register_prog) { .reg = %s, .val = %s };" %
+              (field, field, reg.get('address'), reg.get('value')))
+
+        if guard:
+            c.outdent(4)
+            c("}")
+        c("\n")
+
+#
+
+class Counter:
+    """A <counter> XML element plus the C symbol names generated for it.
+
+    read_sym / max_sym are the names of the generated read and max functions.
+    read_hash / max_hash are the equations with references to other counters
+    of the same set expanded; they stay None until compute_hashes() runs.
+    """
+    def __init__(self, set, xml):
+        self.xml = xml
+        self.set = set
+        self.read_hash = None
+        self.max_hash = None
+
+        sym_prefix = "{0}__{1}__{2}".format(self.set.gen.chipset,
+                                            self.set.underscore_name,
+                                            self.xml.get('underscore_name'))
+        self.read_sym = sym_prefix + "__read"
+
+        max_eq = self.xml.get('max_equation')
+        if not max_eq:
+            self.max_sym = "NULL /* undefined */"
+        elif max_eq == "100":
+            # Percentages share one callback per data type.
+            self.max_sym = "percentage_max_callback_" + self.xml.get('data_type')
+        else:
+            self.max_sym = sym_prefix + "__max"
+
+    def get(self, prop):
+        """Return attribute `prop` of the underlying XML element."""
+        return self.xml.get(prop)
+
+    def compute_hashes(self):
+        """Fill in read_hash and max_hash (no-op once read_hash is set)."""
+        if self.read_hash is not None:
+            return
+
+        def expand(equation):
+            # Replace every "$Name" naming a counter of this set with that
+            # counter's own (recursively expanded) read hash; any other token
+            # is kept verbatim.
+            expanded = []
+            for token in equation.split():
+                if token[0] == "$" and token in self.set.counter_vars:
+                    dependency = self.set.counter_vars[token]
+                    dependency.compute_hashes()
+                    token = dependency.read_hash
+                expanded.append(token)
+            return ' '.join(expanded)
+
+        self.read_hash = expand(self.xml.get('equation'))
+
+        max_eq = self.xml.get('max_equation')
+        if max_eq:
+            self.max_hash = expand(max_eq)
+
+
+class Set:
+    """A <set> XML element (one metric set) and the counters it contains.
+
+    counter_vars maps "$<symbol_name>" to the Counter object; read_funcs and
+    max_funcs map the bare symbol name to the generated C symbol names.
+    """
+    def __init__(self, gen, xml):
+        self.gen = gen
+        self.xml = xml
+
+        self.counter_vars = {}
+        self.max_funcs = {}
+        self.read_funcs = {}
+        self.counter_hashes = {}
+        self.counters = []
+
+        for node in self.xml.findall("counter"):
+            counter = Counter(self, node)
+            self.counters.append(counter)
+            symbol = counter.get('symbol_name')
+            self.counter_vars["$" + symbol] = counter
+            self.max_funcs[symbol] = counter.max_sym
+            self.read_funcs[symbol] = counter.read_sym
+
+        # Hashes can only be computed once every counter of the set is known,
+        # since equations may reference other counters.
+        for counter in self.counters:
+            counter.compute_hashes()
+
+    @property
+    def hw_config_guid(self):
+        """The set's 'hw_config_guid' XML attribute."""
+        return self.xml.get('hw_config_guid')
+
+    @property
+    def name(self):
+        """The set's 'name' XML attribute."""
+        return self.xml.get('name')
+
+    @property
+    def symbol_name(self):
+        """The set's 'symbol_name' XML attribute."""
+        return self.xml.get('symbol_name')
+
+    @property
+    def underscore_name(self):
+        """The set's 'underscore_name' XML attribute."""
+        return self.xml.get('underscore_name')
+
+    def findall(self, path):
+        """Forward to findall() of the underlying XML element."""
+        return self.xml.findall(path)
+
+    def find(self, path):
+        """Forward to find() of the underlying XML element."""
+        return self.xml.find(path)
+
+
+class Gen:
+    """One parsed metrics XML file and the metric sets it describes.
+
+    The chipset name is the lower-cased 'chipset' attribute of the first <set>
+    element found in the file.
+    """
+    def __init__(self, filename):
+        self.filename = filename
+        self.xml = et.parse(self.filename)
+        self.chipset = self.xml.find('.//set').get('chipset').lower()
+        self.sets = [Set(self, node) for node in self.xml.findall(".//set")]
+
+
+def main():
+    """Generate the metrics C source and header from the given XML files.
+
+    Command line: --header and --code name the files to write (either may be
+    omitted), --xml-out requests that a MathML rendering of every counter
+    equation be added to the XML files, and the positional arguments are the
+    metrics XML files to process.
+
+    For every chipset the generated code contains one read (and optionally
+    max) function per counter, one static <chipset>_add_<set>_metric_set()
+    function per metric set and a public intel_perf_load_metrics_<chipset>()
+    entry point, which the header declares.
+    """
+    global c
+    global h
+    global xml_equations
+
+    parser = argparse.ArgumentParser()
+    parser.add_argument("--header", help="Header file to write")
+    parser.add_argument("--code", help="C file to write")
+    parser.add_argument("--xml-out", help="Output XML files (adding mathml equations)")
+    parser.add_argument("xml_files", nargs='+', help="List of xml metrics files to process")
+
+    args = parser.parse_args()
+
+    # Note: either arg may == None
+    h = codegen.Codegen(args.header)
+    c = codegen.Codegen(args.code)
+
+    gens = []
+    for xml_file in args.xml_files:
+        gens.append(Gen(xml_file))
+
+    if args.xml_out:
+        for gen in gens:
+            for set in gen.sets:
+                for counter in set.counters:
+                    xml_equation = splice_mathml_expression(set, counter.get('equation'), "EQ")
+                    # Counter only wraps the XML element; the MathML node has
+                    # to be appended to the element itself.
+                    counter.xml.append(et.fromstring(xml_equation))
+            # NOTE(review): each input file is rewritten in place; the value
+            # given to --xml-out is only used as an on/off switch.
+            gen.xml.write(gen.filename)
+
+
+    copyright = textwrap.dedent("""\
+        /* Autogenerated file, DO NOT EDIT manually! generated by {}
+         *
+         * Copyright (c) 2018 Intel Corporation
+         *
+         * Permission is hereby granted, free of charge, to any person obtaining a
+         * copy of this software and associated documentation files (the "Software"),
+         * to deal in the Software without restriction, including without limitation
+         * the rights to use, copy, modify, merge, publish, distribute, sublicense,
+         * and/or sell copies of the Software, and to permit persons to whom the
+         * Software is furnished to do so, subject to the following conditions:
+         *
+         * The above copyright notice and this permission notice (including the next
+         * paragraph) shall be included in all copies or substantial portions of the
+         * Software.
+         *
+         * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
+         * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
+         * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
+         * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
+         * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
+         * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
+         * DEALINGS IN THE SOFTWARE.
+         */
+
+        """).format(os.path.basename(__file__))
+
+    h(copyright)
+    c(copyright)
+    c(textwrap.dedent("""\
+        #include <stddef.h>
+        #include <stdint.h>
+        #include <stdbool.h>
+        #include <assert.h>
+
+        """))
+
+    # --header is optional (see the note above), in which case there is no
+    # generated header for the C file to include.
+    if args.header:
+        c("#include \"" + os.path.basename(args.header) + "\"")
+
+    c(textwrap.dedent("""\
+        #include <stdlib.h>
+        #include <string.h>
+
+        #include <i915_drm.h>
+
+        #include "i915/perf.h"
+
+        #define MIN(x, y) (((x) < (y)) ? (x) : (y))
+        #define MAX(a, b) (((a) > (b)) ? (a) : (b))
+
+        static double
+        percentage_max_callback_float(const struct intel_perf *perf,
+                                      const struct intel_perf_metric_set *metric_set,
+                                      uint64_t *accumulator)
+        {
+           return 100;
+        }
+
+        static uint64_t
+        percentage_max_callback_uint64(const struct intel_perf *perf,
+                                       const struct intel_perf_metric_set *metric_set,
+                                       uint64_t *accumulator)
+        {
+           return 100;
+        }
+
+        """))
+
+    # Print out all equation functions.
+    for gen in gens:
+        for set in gen.sets:
+            for counter in set.counters:
+                output_counter_read(gen, set, counter)
+                output_counter_max(gen, set, counter)
+
+    # Print out all set registration functions for each set in each
+    # generation.
+    for gen in gens:
+        for set in gen.sets:
+            c("\nstatic void\n")
+            c(gen.chipset + "_add_" + set.underscore_name + "_metric_set(struct intel_perf *perf)")
+            c("{\n")
+            c.indent(4)
+
+            c("struct intel_perf_metric_set *metric_set;\n")
+            c("struct intel_perf_logical_counter *counter;\n\n")
+
+            # Counters are registered in symbol name order.
+            counters = sorted(set.counters, key=lambda k: k.get('symbol_name'))
+
+            c("metric_set = calloc(1, sizeof(*metric_set));\n")
+            c("metric_set->name = \"" + set.name + "\";\n")
+            c("metric_set->symbol_name = \"" + set.symbol_name + "\";\n")
+            c("metric_set->hw_config_guid = \"" + set.hw_config_guid + "\";\n")
+            c("metric_set->counters = calloc({0}, sizeof(struct intel_perf_logical_counter));\n".format(str(len(counters))))
+            c("metric_set->n_counters = 0;\n")
+            c("metric_set->perf_oa_metrics_set = 0; // determined at runtime\n")
+
+            # Haswell uses a different OA report format, hence different
+            # offsets, from every other chipset handled here.
+            if gen.chipset == "hsw":
+                c(textwrap.dedent("""\
+                    metric_set->perf_oa_format = I915_OA_FORMAT_A45_B8_C8;
+
+                    metric_set->perf_raw_size = 256;
+                    metric_set->gpu_time_offset = 0;
+                    metric_set->a_offset = 1;
+                    metric_set->b_offset = metric_set->a_offset + 45;
+                    metric_set->c_offset = metric_set->b_offset + 8;
+
+                    """))
+            else:
+                c(textwrap.dedent("""\
+                    metric_set->perf_oa_format = I915_OA_FORMAT_A32u40_A4u32_B8_C8;
+
+                    metric_set->perf_raw_size = 256;
+                    metric_set->gpu_time_offset = 0;
+                    metric_set->gpu_clock_offset = 1;
+                    metric_set->a_offset = 2;
+                    metric_set->b_offset = metric_set->a_offset + 36;
+                    metric_set->c_offset = metric_set->b_offset + 8;
+
+                    """))
+
+            c("intel_perf_add_metric_set(perf, metric_set);")
+            c("\n")
+
+            generate_register_configs(set)
+
+            for counter in counters:
+                output_counter_report(set, counter)
+
+            # Counters guarded by an availability check may be skipped at
+            # runtime, so fewer than len(counters) may end up registered.
+            c("\nassert(metric_set->n_counters <= {0});\n".format(len(counters)))
+
+            c.outdent(4)
+            c("}\n")
+
+    h(textwrap.dedent("""\
+        #pragma once
+
+        #include "i915/perf.h"
+
+        #ifdef __cplusplus
+        extern "C" {
+        #endif
+
+        """))
+
+    # Print out all set registration functions for each generation.
+    for gen in gens:
+        h("void intel_perf_load_metrics_" + gen.chipset + "(struct intel_perf *perf);\n\n")
+
+        c("\nvoid")
+        c("intel_perf_load_metrics_" + gen.chipset + "(struct intel_perf *perf)")
+        c("{")
+        c.indent(4)
+
+        for set in gen.sets:
+            c("{0}_add_{1}_metric_set(perf);".format(gen.chipset, set.underscore_name))
+
+        c.outdent(4)
+        c("}")
+
+    h(textwrap.dedent("""\
+        #ifdef __cplusplus
+        } /* extern C */
+        #endif
+
+        """))
+
+
+if __name__ == '__main__':
+    main()
diff --git a/lib/i915/perf-configs/update-guids.py b/lib/i915/perf-configs/update-guids.py
new file mode 100755
index 00000000..c507cb7e
--- /dev/null
+++ b/lib/i915/perf-configs/update-guids.py
@@ -0,0 +1,231 @@
+#!/usr/bin/env python2
+# coding=utf-8
+
+# Copyright (C) 2016 Intel Corporation
+#
+# Permission is hereby granted, free of charge, to any person obtaining a copy
+# of this software and associated documentation files (the "Software"), to deal
+# in the Software without restriction, including without limitation the rights
+# to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
+# copies of the Software, and to permit persons to whom the Software is
+# furnished to do so, subject to the following conditions:
+#
+# The above copyright notice and this permission notice shall be included in
+# all copies or substantial portions of the Software.
+#
+# THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
+# IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
+# FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
+# AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
+# LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
+# OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
+# SOFTWARE.
+
+# This script can:
+#
+# - Automatically add template entries for unregistered metric sets discovered
+#   in new mdapi xml files.
+# - Once mdapi-xml-convert.py has been run to output register configs for new
+#   metric sets then re-running this script can add the config_hash attribute
+#   to corresponding registry entries.
+#
+# The script is designed to allow incremental updates/fixups of the guid
+# registry by working in terms of:
+#
+# 1) load all the existing state
+# 2) apply tweaks/modifications
+# 3) write everything back out
+#
+# The script should gracefully handle incomplete guid entries, which is
+# important when considering how the mdapi-xml-convert.py script depends on the
+# 'mdapi_config_hash' attribute while adding the 'config_hash' attribute
+# depends on the configs output by mdapi-xml-convert.py.
+
+
+
+import argparse
+import os.path
+import re
+import sys
+import time
+import uuid
+
+import xml.etree.ElementTree as et
+import xml.sax.saxutils as saxutils
+
+import oa_guid_registry as oa_registry
+
+
+def print_err(*args):
+    """Write the arguments to stderr, space separated, followed by a newline."""
+    message = ' '.join(str(arg) for arg in args)
+    sys.stderr.write(message + '\n')
+
+def guid_hashing_key(guid_obj):
+    """Return the lookup key derived from an entry's chipset and MDAPI config hash.
+
+    The entry must have both the 'chipset' and 'mdapi_config_hash' keys.
+    """
+    chipset = guid_obj['chipset']
+    mdapi_hash = guid_obj['mdapi_config_hash']
+    return oa_registry.Registry.chipset_derive_hash(chipset, mdapi_hash)
+
+# Command line: one or more MDAPI XML files, plus the (mandatory) GUID registry
+# file to update.
+parser = argparse.ArgumentParser()
+parser.add_argument("xml", nargs="+", help="XML description of metrics")
+parser.add_argument("--guids", required=True, help="Metric set GUID registry")
+
+args = parser.parse_args()
+
+
+# Every registry entry is a dict; the same dict object is shared between the
+# list and the lookup tables below, so an update through one is seen by all.
+guids = [] # all entries, in output order
+guid_index = {} # guid objects indexed by id
+mdapi_config_hash_guid_table = {} # indexed by the key derived from chipset + MDAPI XML register config hash
+named_guid_table = {} # indexed by name=<chipset>_<symbol_name>
+
+
+
+# 1) read everything we have currently
+#
+# Registry entries may be incomplete: only the attributes actually present are
+# copied, and an entry is only added to a lookup table when it has everything
+# that table's key is built from.
+guids_xml = et.parse(args.guids)
+for guid in guids_xml.findall(".//guid"):
+    guid_obj = {}
+
+    # Entries without an id get a freshly generated one.
+    guid_id = guid.get('id')
+    guid_obj['id'] = guid_id if guid_id != None else str(uuid.uuid4())
+
+    for attr in ('mdapi_config_hash', 'config_hash', 'chipset', 'name'):
+        value = guid.get(attr)
+        if value != None:
+            guid_obj[attr] = value
+
+    # Both lookup keys involve the chipset; an entry lacking it is still kept
+    # (and written back out) but cannot be indexed by name or by config hash.
+    if 'chipset' in guid_obj:
+        if 'name' in guid_obj:
+            named_guid_table[guid_obj['chipset'] + "_" + guid_obj['name']] = guid_obj
+        if 'mdapi_config_hash' in guid_obj:
+            mdapi_config_hash_guid_table[guid_hashing_key(guid_obj)] = guid_obj
+
+    guids.append(guid_obj)
+
+    if guid_obj['id'] in guid_index:
+        print_err("Duplicate GUID " + guid_obj['id'] + "!")
+        sys.exit(1)
+    guid_index[guid_obj['id']] = guid_obj
+
+
+#
+# 2) fixup/modify the guid entries...
+#
+
+
+# Match every metric set of every MDAPI XML file against the registry, first
+# by config hash, then by <chipset>_<name>; sets matching neither get a new
+# entry with a fresh GUID.
+for arg in args.xml:
+    internal = et.parse(arg)
+
+    # Only the first ConcurrentGroup of the file is consulted.
+    concurrent_group = internal.find(".//ConcurrentGroup")
+
+    for mdapi_set in internal.findall(".//MetricSet"):
+
+        mdapi_config_hash = oa_registry.Registry.mdapi_hw_config_hash(mdapi_set)
+
+        # The chipset name is the lower-cased SupportedHW, with the
+        # lower-cased SupportedGT of the concurrent group appended when set.
+        chipset = mdapi_set.get('SupportedHW').lower()
+        if concurrent_group.get('SupportedGT') != None:
+            chipset = chipset + concurrent_group.get('SupportedGT').lower()
+
+        set_name = mdapi_set.get('SymbolName')
+
+        name = chipset + "_" + set_name;
+
+        hashing_key = oa_registry.Registry.chipset_derive_hash(chipset, mdapi_config_hash)
+        if hashing_key in mdapi_config_hash_guid_table:
+            # Same register config as a known entry: refresh its name/chipset.
+            guid_obj = mdapi_config_hash_guid_table[hashing_key]
+
+            guid_obj['name'] = set_name
+            guid_obj['chipset'] = chipset
+            guid_obj['matched_mdapi'] = True
+        elif name in named_guid_table:
+            # Known name but a different register config: record the new MDAPI
+            # hash and drop the now stale config_hash.
+            guid_obj = named_guid_table[name]
+
+            guid_obj['matched_mdapi'] = True
+            guid_obj['mdapi_config_hash'] = mdapi_config_hash
+            if 'config_hash' in guid_obj:
+                del guid_obj['config_hash']
+            guid_obj['comment'] = "WARNING: MDAPI XML config hash changed! If upstream, double check raw counter semantics unchanged"
+            print_err("WARNING: MDAPI XML config hash changed for \"" + set_name + "\" (" + chipset + ") If upstream, double check raw counter semantics unchanged")
+        else:
+            # Never seen before: create a template entry with a new GUID.
+            guid_obj = { 'mdapi_config_hash': mdapi_config_hash,
+                         'id': str(uuid.uuid4()),
+                         'name': set_name,
+                         'chipset': chipset,
+                         'unregistered': True,
+                         'matched_mdapi': True,
+                         'comment': "New"
+                       }
+            guid_index[guid_obj['id']] = guid_obj
+            mdapi_config_hash_guid_table[guid_hashing_key(guid_obj)] = guid_obj
+            guids.append(guid_obj)
+            print_err("New GUID \"" + guid_obj['id'] + "\" for metric set = " + set_name + " (" + chipset + ")")
+
+        # (Re)index by name so that the config_hash pass below finds the entry.
+        named_guid_table[chipset + '_' + set_name] = guid_obj
+
+
+
+# Chipsets whose converted config file ('oa-<chipset>.xml' in the current
+# directory) is scanned to refresh the 'config_hash' of registry entries.
+chipsets = [ 'hsw',
+             'bdw', 'chv',
+             'sklgt2', 'sklgt3', 'sklgt4', 'kblgt2', 'kblgt3', 'cflgt2', 'cflgt3',
+             'bxt', 'glk',
+             'cnl',
+             'icl', 'lkf',
+             'tgl' ]
+
+for chipset in chipsets:
+    filename = 'oa-{0}.xml'.format(chipset)
+    if os.path.isfile(filename):
+        public = et.parse(filename)
+
+        for metricset in public.findall(".//set"):
+            set_name = metricset.get('symbol_name')
+            config_hash = oa_registry.Registry.hw_config_hash(metricset)
+
+            # Only entries already known by name get their hash updated.
+            guid_key = chipset + "_" + set_name
+            if guid_key in named_guid_table:
+                guid_obj = named_guid_table[guid_key]
+                guid_obj['config_hash'] = config_hash
+
+
+#
+# 3) write all the guids back out...
+
+# The registry is written to stdout. Attribute values come from parsed XML and
+# are therefore unescaped strings; quoteattr() re-escapes and quotes them so
+# that values containing &, < or quotes still produce well-formed XML.
+print("<guids>")
+for guid_obj in guids:
+    comment = None
+
+    if 'matched_mdapi' not in guid_obj:
+        comment = "Not found in MDAPI XML file[s]; Entry copied unmodified (maybe removed from MDAPI XML or not all files given on command line)"
+
+    # A comment set while matching takes precedence over the default one.
+    if 'comment' in guid_obj:
+        comment = guid_obj['comment']
+
+    # Attributes are always written in this order; all but 'id' are optional.
+    line = "<guid"
+    for attr in ('config_hash', 'mdapi_config_hash', 'id', 'chipset', 'name'):
+        if attr in guid_obj:
+            line = line + ' ' + attr + '=' + saxutils.quoteattr(guid_obj[attr])
+    line = line + ' />'
+
+    if comment != None:
+        print("    <!-- ↓" + comment + " -->")
+
+    print("    " + line)
+print("</guids>")
diff --git a/lib/i915/perf.c b/lib/i915/perf.c
new file mode 100644
index 00000000..31888627
--- /dev/null
+++ b/lib/i915/perf.c
@@ -0,0 +1,424 @@
+/*
+ * Copyright (C) 2018 Intel Corporation
+ *
+ * Permission is hereby granted, free of charge, to any person obtaining a copy
+ * of this software and associated documentation files (the "Software"), to deal
+ * in the Software without restriction, including without limitation the rights
+ * to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
+ * copies of the Software, and to permit persons to whom the Software is
+ * furnished to do so, subject to the following conditions:
+ *
+ * The above copyright notice and this permission notice shall be included in
+ * all copies or substantial portions of the Software.
+ *
+ * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
+ * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
+ * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
+ * AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
+ * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
+ * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
+ * SOFTWARE.
+ */
+
+#include <assert.h>
+#include <errno.h>
+#include <stdio.h>
+#include <stdlib.h>
+#include <string.h>
+#include <dirent.h>
+#include <fcntl.h>
+#include <sys/ioctl.h>
+#include <sys/stat.h>
+#include <sys/sysmacros.h>
+#include <sys/types.h>
+#include <unistd.h>
+
+#include <i915_drm.h>
+
+#include "intel_chipset.h"
+#include "perf.h"
+#include "i915_perf_metrics.h"
+
+/*
+ * Allocate a counter group called @name (the string is duplicated) with empty
+ * counter and sub-group lists. When @parent is given the new group is linked
+ * at the tail of the parent's sub-group list, otherwise its link is
+ * initialised as a stand-alone list head. @perf is currently unused.
+ *
+ * Returns NULL if memory cannot be allocated; nothing is linked in that case.
+ */
+static struct intel_perf_logical_counter_group *
+intel_perf_logical_counter_group_new(struct intel_perf *perf,
+				     struct intel_perf_logical_counter_group *parent,
+				     const char *name)
+{
+	struct intel_perf_logical_counter_group *group = calloc(1, sizeof(*group));
+
+	if (!group)
+		return NULL;
+
+	group->name = strdup(name);
+	if (!group->name) {
+		free(group);
+		return NULL;
+	}
+
+	IGT_INIT_LIST_HEAD(&group->counters);
+	IGT_INIT_LIST_HEAD(&group->groups);
+
+	if (parent)
+		igt_list_add_tail(&group->link, &parent->groups);
+	else
+		IGT_INIT_LIST_HEAD(&group->link);
+
+	return group;
+}
+
+/*
+ * Free @group and, recursively, every group on its sub-group list. Entries on
+ * the group's counters list are not touched here.
+ */
+static void
+intel_perf_logical_counter_group_free(struct intel_perf_logical_counter_group *group)
+{
+	struct intel_perf_logical_counter_group *sub, *next;
+
+	/* The _safe iterator is needed as each entry is unlinked and freed. */
+	igt_list_for_each_entry_safe(sub, next, &group->groups, link) {
+		igt_list_del(&sub->link);
+		intel_perf_logical_counter_group_free(sub);
+	}
+
+	free(group->name);
+	free(group);
+}
+
+/*
+ * Free @metric_set together with the arrays it owns: the counters and the
+ * flex/mux/b-counter register programming arrays that the generated
+ * <chipset>_add_*_metric_set() functions calloc(). A set without registers of
+ * a given kind has a NULL pointer there (the set itself is calloc()ed), which
+ * free() accepts.
+ */
+static void
+intel_perf_metric_set_free(struct intel_perf_metric_set *metric_set)
+{
+	free(metric_set->flex_regs);
+	free(metric_set->mux_regs);
+	free(metric_set->b_counter_regs);
+	free(metric_set->counters);
+	free(metric_set);
+}
+
+/* Test bit @s of the slice mask found at the very start of topo->data[]. */
+static bool
+slice_available(const struct drm_i915_query_topology_info *topo,
+		int s)
+{
+	const int byte = s / 8;
+	const int bit = s % 8;
+
+	return (topo->data[byte] >> bit) & 1;
+}
+
+/*
+ * Test bit @ss of slice @s's subslice mask. The masks start at
+ * topo->subslice_offset in topo->data[], one every topo->subslice_stride
+ * bytes.
+ */
+static bool
+subslice_available(const struct drm_i915_query_topology_info *topo,
+		   int s, int ss)
+{
+	const int byte = topo->subslice_offset +
+			 s * topo->subslice_stride +
+			 ss / 8;
+	const int bit = ss % 8;
+
+	return (topo->data[byte] >> bit) & 1;
+}
+
+/*
+ * Test bit @eu of the EU mask of subslice @ss in slice @s. The masks start at
+ * topo->eu_offset in topo->data[], one every topo->eu_stride bytes, indexed by
+ * s * topo->max_subslices + ss.
+ */
+static bool
+eu_available(const struct drm_i915_query_topology_info *topo,
+	     int s, int ss, int eu)
+{
+	const int byte = topo->eu_offset +
+			 (s * topo->max_subslices + ss) * topo->eu_stride +
+			 eu / 8;
+	const int bit = eu % 8;
+
+	return (topo->data[byte] >> bit) & 1;
+}
+
+/* Build an intel_perf object for a device described by explicit
+ * parameters instead of an open DRM file descriptor.
+ *
+ * @device_id, @revision, @timestamp_frequency, @gt_min_freq and
+ * @gt_max_freq are copied as is into perf->devinfo. @topology is only read
+ * during the call; the slice/subslice masks and the EU count are derived
+ * from it.
+ *
+ * Returns the new object (to be released with intel_perf_free()), or NULL
+ * when no device info is found for @device_id, when the allocation fails,
+ * or when there is no metrics database for the platform/GT combination.
+ */
+struct intel_perf *
+intel_perf_for_devinfo(uint32_t device_id,
+		       uint32_t revision,
+		       uint64_t timestamp_frequency,
+		       uint64_t gt_min_freq,
+		       uint64_t gt_max_freq,
+		       const struct drm_i915_query_topology_info *topology)
+{
+	const struct intel_device_info *devinfo = intel_get_device_info(device_id);
+	struct intel_perf *perf;
+	int bits_per_subslice;
+
+	if (!devinfo)
+		return NULL;
+
+	perf = calloc(1, sizeof(*perf));
+	if (!perf)
+		return NULL;
+
+	perf->root_group = intel_perf_logical_counter_group_new(perf, NULL, "");
+
+	IGT_INIT_LIST_HEAD(&perf->metric_sets);
+
+	/* Initialize the device characteristics first. Loading the
+	 * metrics uses that information to detect whether some
+	 * counters are available on a given device (for example BXT
+	 * 2x6 does not have 2 samplers).
+	 */
+	perf->devinfo.devid = device_id;
+	perf->devinfo.revision = revision;
+	perf->devinfo.timestamp_frequency = timestamp_frequency;
+	perf->devinfo.gt_min_freq = gt_min_freq;
+	perf->devinfo.gt_max_freq = gt_max_freq;
+
+	/* On Gen11+ the equations from the xml files expect an 8bits
+	 * mask per subslice, versus only 3bits on prior Gens.
+	 */
+	bits_per_subslice = devinfo->gen >= 11 ? 8 : 3;
+	for (uint32_t s = 0; s < topology->max_slices; s++) {
+		if (!slice_available(topology, s))
+			continue;
+
+		perf->devinfo.slice_mask |= 1ULL << s;
+		for (uint32_t ss = 0; ss < topology->max_subslices; ss++) {
+			/* Test subslice ss of the current slice s. */
+			if (!subslice_available(topology, s, ss))
+				continue;
+
+			perf->devinfo.subslice_mask |= 1ULL << (s * bits_per_subslice + ss);
+
+			for (uint32_t eu = 0; eu < topology->max_eus_per_subslice; eu++) {
+				if (eu_available(topology, s, ss, eu))
+					perf->devinfo.n_eus++;
+			}
+		}
+	}
+
+	/* Both masks are 64 bits wide: the "ll" variant is needed so that
+	 * bits above 31 are counted as well.
+	 */
+	perf->devinfo.n_eu_slices = __builtin_popcountll(perf->devinfo.slice_mask);
+	perf->devinfo.n_eu_sub_slices = __builtin_popcountll(perf->devinfo.subslice_mask);
+
+	/* Valid on most generations except Gen9LP. */
+	perf->devinfo.eu_threads_count = 7;
+
+	if (devinfo->is_haswell) {
+		intel_perf_load_metrics_hsw(perf);
+	} else if (devinfo->is_broadwell) {
+		intel_perf_load_metrics_bdw(perf);
+	} else if (devinfo->is_cherryview) {
+		intel_perf_load_metrics_chv(perf);
+	} else if (devinfo->is_skylake) {
+		switch (devinfo->gt) {
+		case 2:
+			intel_perf_load_metrics_sklgt2(perf);
+			break;
+		case 3:
+			intel_perf_load_metrics_sklgt3(perf);
+			break;
+		case 4:
+			intel_perf_load_metrics_sklgt4(perf);
+			break;
+		default:
+			goto unsupported;
+		}
+	} else if (devinfo->is_broxton) {
+		perf->devinfo.eu_threads_count = 6;
+		intel_perf_load_metrics_bxt(perf);
+	} else if (devinfo->is_kabylake) {
+		switch (devinfo->gt) {
+		case 2:
+			intel_perf_load_metrics_kblgt2(perf);
+			break;
+		case 3:
+			intel_perf_load_metrics_kblgt3(perf);
+			break;
+		default:
+			goto unsupported;
+		}
+	} else if (devinfo->is_geminilake) {
+		perf->devinfo.eu_threads_count = 6;
+		intel_perf_load_metrics_glk(perf);
+	} else if (devinfo->is_coffeelake) {
+		switch (devinfo->gt) {
+		case 2:
+			intel_perf_load_metrics_cflgt2(perf);
+			break;
+		case 3:
+			intel_perf_load_metrics_cflgt3(perf);
+			break;
+		default:
+			goto unsupported;
+		}
+	} else if (devinfo->is_cannonlake) {
+		intel_perf_load_metrics_cnl(perf);
+	} else if (devinfo->is_icelake) {
+		intel_perf_load_metrics_icl(perf);
+	} else if (devinfo->is_elkhartlake) {
+		intel_perf_load_metrics_lkf(perf);
+	} else if (devinfo->is_tigerlake) {
+		intel_perf_load_metrics_tgl(perf);
+	} else {
+		goto unsupported;
+	}
+
+	return perf;
+
+unsupported:
+	/* No metrics database for this platform/GT: report it to the caller
+	 * with NULL, like the other failures, rather than aborting.
+	 */
+	intel_perf_free(perf);
+	return NULL;
+}
+
+/* Issue an i915 GETPARAM ioctl for @param, retrying while it fails with
+ * EAGAIN or EINTR. The result variable starts at -1, so that is what gets
+ * returned (converted to uint32_t) unless the ioctl stores another value.
+ */
+static uint32_t
+getparam(int drm_fd, uint32_t param)
+{
+	struct drm_i915_getparam gp;
+	int value = -1;
+	int err;
+
+	memset(&gp, 0, sizeof(gp));
+	gp.param = param;
+	gp.value = &value;
+
+	do {
+		err = ioctl(drm_fd, DRM_IOCTL_I915_GETPARAM, &gp);
+	} while (err < 0 && (errno == EAGAIN || errno == EINTR));
+
+	return value;
+}
+
+/* Read up to 31 bytes from @fd and parse them with strtoull() (base
+ * auto-detected). Returns false only when read() fails; the parsed number
+ * is stored in @out_value otherwise.
+ */
+static bool
+read_fd_uint64(int fd, uint64_t *out_value)
+{
+	char text[32];
+	int len = read(fd, text, sizeof (text) - 1);
+
+	if (len >= 0) {
+		/* read() does not terminate the buffer. */
+		text[len] = '\0';
+		*out_value = strtoull(text, 0, 0);
+	}
+
+	return len >= 0;
+}
+
+/* Open @file_path relative to @sysfs_dir_fd and parse its content as an
+ * unsigned 64-bit number into @out_value. Returns false when the file
+ * cannot be opened or read.
+ */
+static bool
+read_sysfs(int sysfs_dir_fd, const char *file_path, uint64_t *out_value)
+{
+	bool res = false;
+	int fd = openat(sysfs_dir_fd, file_path, O_RDONLY);
+
+	if (fd >= 0) {
+		res = read_fd_uint64(fd, out_value);
+		close(fd);
+	}
+
+	return res;
+}
+
+/* Submit @n_items query items through DRM_IOCTL_I915_QUERY, retrying
+ * while the ioctl fails with EAGAIN or EINTR. Returns the value of the
+ * last ioctl() call.
+ */
+static int
+query_items(int drm_fd, struct drm_i915_query_item *items, uint32_t n_items)
+{
+	struct drm_i915_query q = {
+		.num_items = n_items,
+		.items_ptr = (uintptr_t) items,
+	};
+	int ret;
+
+	do {
+		ret = ioctl(drm_fd, DRM_IOCTL_I915_QUERY, &q);
+	} while (ret < 0 && (errno == EAGAIN || errno == EINTR));
+
+	return ret;
+}
+
+/* Fetch the topology description of the device behind @drm_fd.
+ *
+ * The query is issued twice: first without a buffer, to obtain the needed
+ * size in item.length, then with a buffer of that size.
+ *
+ * Returns a heap allocated structure the caller must free(), or NULL when
+ * a query or the allocation fails.
+ */
+static struct drm_i915_query_topology_info *
+query_topology(int drm_fd)
+{
+	struct drm_i915_query_item item;
+	struct drm_i915_query_topology_info *topo_info;
+
+	memset(&item, 0, sizeof(item));
+	item.query_id = DRM_I915_QUERY_TOPOLOGY_INFO;
+	if (query_items(drm_fd, &item, 1) < 0 || item.length < 0)
+		return NULL;
+
+	topo_info = calloc(1, item.length);
+	if (!topo_info)
+		return NULL;
+
+	item.data_ptr = (uintptr_t) topo_info;
+	if (query_items(drm_fd, &item, 1) < 0 || item.length < 0) {
+		free(topo_info);
+		return NULL;
+	}
+
+	return topo_info;
+}
+
+/* Open the sysfs directory /sys/dev/char/<major>:0, where <major> is the
+ * major number of the character device behind @drm_fd (the minor is fixed
+ * to 0).
+ *
+ * Returns a directory file descriptor the caller must close(), or -1 when
+ * @drm_fd cannot be stat'ed, is not a character device, or the directory
+ * cannot be opened.
+ */
+static int
+open_master_sysfs_dir(int drm_fd)
+{
+	char path[128];
+	struct stat st;
+
+	if (fstat(drm_fd, &st) || !S_ISCHR(st.st_mode))
+		return -1;
+
+	/* major() yields an unsigned value, hence %u. */
+	snprintf(path, sizeof(path), "/sys/dev/char/%u:0",
+		 major(st.st_rdev));
+
+	return open(path, O_DIRECTORY);
+}
+
+/* Build an intel_perf object for the device behind @drm_fd.
+ *
+ * Device id, revision and timestamp frequency come from GETPARAM, the GT
+ * frequency range from the gt_{min,max}_freq_mhz sysfs files (scaled by
+ * 1000000 before being handed over) and the topology from the i915 query
+ * ioctl.
+ *
+ * Returns NULL when the sysfs directory cannot be opened, a frequency
+ * file cannot be read or the topology query fails; otherwise whatever
+ * intel_perf_for_devinfo() returns.
+ */
+struct intel_perf *
+intel_perf_for_fd(int drm_fd)
+{
+	uint32_t device_id = getparam(drm_fd, I915_PARAM_CHIPSET_ID);
+	uint32_t device_revision = getparam(drm_fd, I915_PARAM_REVISION);
+	uint32_t timestamp_frequency = getparam(drm_fd, I915_PARAM_CS_TIMESTAMP_FREQUENCY);
+	uint64_t min_mhz;
+	uint64_t max_mhz;
+	struct drm_i915_query_topology_info *topology;
+	struct intel_perf *perf;
+	bool have_freqs;
+	int sysfs_dir_fd;
+
+	sysfs_dir_fd = open_master_sysfs_dir(drm_fd);
+	if (sysfs_dir_fd < 0)
+		return NULL;
+
+	/* The directory is only needed for these two reads. */
+	have_freqs = read_sysfs(sysfs_dir_fd, "gt_min_freq_mhz", &min_mhz) &&
+		     read_sysfs(sysfs_dir_fd, "gt_max_freq_mhz", &max_mhz);
+	close(sysfs_dir_fd);
+	if (!have_freqs)
+		return NULL;
+
+	topology = query_topology(drm_fd);
+	if (!topology)
+		return NULL;
+
+	perf = intel_perf_for_devinfo(device_id,
+				      device_revision,
+				      timestamp_frequency,
+				      min_mhz * 1000000,
+				      max_mhz * 1000000,
+				      topology);
+	free(topology);
+
+	return perf;
+}
+
+/* Destroy @perf: the counter group tree is released, every metric set is
+ * unlinked and freed, and finally the object itself is freed.
+ */
+void
+intel_perf_free(struct intel_perf *perf)
+{
+	struct intel_perf_metric_set *set, *next;
+
+	intel_perf_logical_counter_group_free(perf->root_group);
+
+	/* Entries are removed while iterating, hence the _safe variant. */
+	igt_list_for_each_entry_safe(set, next, &perf->metric_sets, link) {
+		igt_list_del(&set->link);
+		intel_perf_metric_set_free(set);
+	}
+
+	free(perf);
+}
+
+/* Attach @counter to the group designated by @group_path.
+ *
+ * @group_path is a '/' separated list of group names resolved starting at
+ * perf->root_group; groups missing along the way are created. An empty
+ * path attaches the counter to the root group. Path components longer
+ * than 127 characters are truncated to fit the local name buffer.
+ */
+void
+intel_perf_add_logical_counter(struct intel_perf *perf,
+			       struct intel_perf_logical_counter *counter,
+			       const char *group_path)
+{
+	const char *group_path_end = group_path + strlen(group_path);
+	struct intel_perf_logical_counter_group *group = perf->root_group;
+	const char *name = group_path;
+
+	while (name < group_path_end) {
+		const char *name_end = strchr(name, '/');
+		char group_name[128] = { 0, };
+		struct intel_perf_logical_counter_group *iter_group, *child_group = NULL;
+		size_t name_len;
+
+		if (!name_end)
+			name_end = group_path_end;
+
+		/* Never write past group_name and keep its terminating NUL. */
+		name_len = name_end - name;
+		if (name_len >= sizeof(group_name))
+			name_len = sizeof(group_name) - 1;
+		memcpy(group_name, name, name_len);
+
+		/* Reuse the child group with that name if it already exists. */
+		igt_list_for_each_entry(iter_group, &group->groups, link) {
+			if (!strcmp(iter_group->name, group_name)) {
+				child_group = iter_group;
+				break;
+			}
+		}
+
+		if (!child_group)
+			child_group = intel_perf_logical_counter_group_new(perf, group, group_name);
+
+		name = name_end + 1;
+		group = child_group;
+	}
+
+	/* group is the last group of the path, or the root group when the
+	 * path is empty.
+	 */
+	igt_list_add_tail(&counter->link, &group->counters);
+}
+
+/* Append @metric_set at the tail of perf->metric_sets. intel_perf_free()
+ * later frees every set found on that list.
+ */
+void
+intel_perf_add_metric_set(struct intel_perf *perf,
+			  struct intel_perf_metric_set *metric_set)
+{
+	igt_list_add_tail(&metric_set->link, &perf->metric_sets);
+}
diff --git a/lib/i915/perf.h b/lib/i915/perf.h
new file mode 100644
index 00000000..7dfa0472
--- /dev/null
+++ b/lib/i915/perf.h
@@ -0,0 +1,227 @@
+/*
+ * Copyright (C) 2015-2016 Intel Corporation
+ *
+ * Permission is hereby granted, free of charge, to any person obtaining a copy
+ * of this software and associated documentation files (the "Software"), to deal
+ * in the Software without restriction, including without limitation the rights
+ * to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
+ * copies of the Software, and to permit persons to whom the Software is
+ * furnished to do so, subject to the following conditions:
+ *
+ * The above copyright notice and this permission notice shall be included in
+ * all copies or substantial portions of the Software.
+ *
+ * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
+ * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
+ * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
+ * AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
+ * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
+ * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
+ * SOFTWARE.
+ */
+
+#ifndef PERF_METRICS_H
+#define PERF_METRICS_H
+
+#ifdef __cplusplus
+extern "C" {
+#endif
+
+#include <stdbool.h>
+#include <stdint.h>
+
+#include "igt_list.h"
+
+struct intel_device_info;
+
+/* Device characteristics filled by intel_perf_for_devinfo(). */
+struct intel_perf_devinfo {
+	char devname[20];
+	char prettyname[100];
+
+	/*
+	 * Always false for gputop, we don't have the additional
+	 * snapshots of register values, only the OA reports.
+	 */
+	bool query_mode;
+
+	bool has_dynamic_configs;
+
+	/* The following fields are prepared for equations from the XML files.
+	 * Their values are built up from the topology fields.
+	 */
+	uint32_t devid;
+	uint32_t gen;
+	uint32_t revision;
+	uint64_t timestamp_frequency;
+	/* intel_perf_for_fd() passes the sysfs MHz values scaled by 1000000. */
+	uint64_t gt_min_freq;
+	uint64_t gt_max_freq;
+
+	/* Number of EUs flagged available in the topology. */
+	uint64_t n_eus;
+	/* Population counts of slice_mask and subslice_mask respectively. */
+	uint64_t n_eu_slices;
+	uint64_t n_eu_sub_slices;
+	/* Bit (slice * N + subslice), with N = 8 on Gen11+ and 3 before. */
+	uint64_t subslice_mask;
+	/* Bit s is set when slice s is available. */
+	uint64_t slice_mask;
+	/* 7 by default, 6 on Broxton and Geminilake. */
+	uint64_t eu_threads_count;
+};
+
+/* Value type of a logical counter. NOTE(review): presumably selects which
+ * of the read_ and max_ callback flavours applies; confirm against the
+ * generated metrics code.
+ */
+typedef enum {
+	INTEL_PERF_LOGICAL_COUNTER_STORAGE_UINT64,
+	INTEL_PERF_LOGICAL_COUNTER_STORAGE_UINT32,
+	INTEL_PERF_LOGICAL_COUNTER_STORAGE_DOUBLE,
+	INTEL_PERF_LOGICAL_COUNTER_STORAGE_FLOAT,
+	INTEL_PERF_LOGICAL_COUNTER_STORAGE_BOOL32,
+} intel_perf_logical_counter_storage_t;
+
+/* Kind of measurement a logical counter reports (stored in
+ * intel_perf_logical_counter.type).
+ */
+typedef enum {
+	INTEL_PERF_LOGICAL_COUNTER_TYPE_RAW,
+	INTEL_PERF_LOGICAL_COUNTER_TYPE_DURATION_RAW,
+	INTEL_PERF_LOGICAL_COUNTER_TYPE_DURATION_NORM,
+	INTEL_PERF_LOGICAL_COUNTER_TYPE_EVENT,
+	INTEL_PERF_LOGICAL_COUNTER_TYPE_THROUGHPUT,
+	INTEL_PERF_LOGICAL_COUNTER_TYPE_TIMESTAMP,
+} intel_perf_logical_counter_type_t;
+
+/* Unit of the value reported by a logical counter (stored in
+ * intel_perf_logical_counter.unit). INTEL_PERF_LOGICAL_COUNTER_UNIT_MAX is
+ * the last enumerator and therefore equals the number of units.
+ */
+typedef enum {
+	/* size */
+	INTEL_PERF_LOGICAL_COUNTER_UNIT_BYTES,
+
+	/* frequency */
+	INTEL_PERF_LOGICAL_COUNTER_UNIT_HZ,
+
+	/* time */
+	INTEL_PERF_LOGICAL_COUNTER_UNIT_NS,
+	INTEL_PERF_LOGICAL_COUNTER_UNIT_US,
+
+	/* miscellaneous */
+	INTEL_PERF_LOGICAL_COUNTER_UNIT_PIXELS,
+	INTEL_PERF_LOGICAL_COUNTER_UNIT_TEXELS,
+	INTEL_PERF_LOGICAL_COUNTER_UNIT_THREADS,
+	INTEL_PERF_LOGICAL_COUNTER_UNIT_PERCENT,
+
+	/* events */
+	INTEL_PERF_LOGICAL_COUNTER_UNIT_MESSAGES,
+	INTEL_PERF_LOGICAL_COUNTER_UNIT_NUMBER,
+	INTEL_PERF_LOGICAL_COUNTER_UNIT_CYCLES,
+	INTEL_PERF_LOGICAL_COUNTER_UNIT_EVENTS,
+	INTEL_PERF_LOGICAL_COUNTER_UNIT_UTILIZATION,
+
+	/* L3 cache line related units */
+	INTEL_PERF_LOGICAL_COUNTER_UNIT_EU_SENDS_TO_L3_CACHE_LINES,
+	INTEL_PERF_LOGICAL_COUNTER_UNIT_EU_ATOMIC_REQUESTS_TO_L3_CACHE_LINES,
+	INTEL_PERF_LOGICAL_COUNTER_UNIT_EU_REQUESTS_TO_L3_CACHE_LINES,
+	INTEL_PERF_LOGICAL_COUNTER_UNIT_EU_BYTES_PER_L3_CACHE_LINE,
+
+	INTEL_PERF_LOGICAL_COUNTER_UNIT_MAX
+} intel_perf_logical_counter_unit_t;
+
+
+struct intel_perf;
+struct intel_perf_metric_set;
+/* A counter exposed to users, belonging to one metric set and linked into
+ * one counter group.
+ *
+ * The max_ and read_ callbacks each exist in a uint64_t and a double
+ * flavour sharing storage through an anonymous union. NOTE(review):
+ * presumably `storage` tells which flavour is valid; confirm against the
+ * generated metrics code.
+ */
+struct intel_perf_logical_counter {
+	const struct intel_perf_metric_set *metric_set;
+	const char *name;
+	const char *symbol_name;
+	const char *desc;
+	intel_perf_logical_counter_storage_t storage;
+	intel_perf_logical_counter_type_t type;
+	intel_perf_logical_counter_unit_t unit;
+	union {
+		uint64_t (*max_uint64)(const struct intel_perf *perf,
+				       const struct intel_perf_metric_set *metric_set,
+				       uint64_t *deltas);
+		double (*max_float)(const struct intel_perf *perf,
+				    const struct intel_perf_metric_set *metric_set,
+				    uint64_t *deltas);
+	};
+
+	union {
+		uint64_t (*read_uint64)(const struct intel_perf *perf,
+					const struct intel_perf_metric_set *metric_set,
+					uint64_t *deltas);
+		double (*read_float)(const struct intel_perf *perf,
+				     const struct intel_perf_metric_set *metric_set,
+				     uint64_t *deltas);
+	};
+
+	struct igt_list_head link; /* list from intel_perf_logical_counter_group.counters */
+};
+
+/* One entry of the register lists of a metric set. NOTE(review):
+ * presumably a register offset and the value to program; confirm against
+ * the generated metrics code.
+ */
+struct intel_perf_register_prog {
+	uint32_t reg;
+	uint32_t val;
+};
+
+/* A set of counters together with its register programming lists. */
+struct intel_perf_metric_set {
+	const char *name;
+	const char *symbol_name;
+	const char *hw_config_guid;
+
+	/* Array of n_counters entries (presumably), freed along with the set. */
+	struct intel_perf_logical_counter *counters;
+	int n_counters;
+
+	uint64_t perf_oa_metrics_set;
+	int perf_oa_format;
+	int perf_raw_size;
+
+	/* For indexing into accumulator->deltas[] ... */
+	int gpu_time_offset;
+	int gpu_clock_offset;
+	int a_offset;
+	int b_offset;
+	int c_offset;
+
+	/* Register lists, each paired with its number of entries. */
+	struct intel_perf_register_prog *b_counter_regs;
+	uint32_t n_b_counter_regs;
+
+	struct intel_perf_register_prog *mux_regs;
+	uint32_t n_mux_regs;
+
+	struct intel_perf_register_prog *flex_regs;
+	uint32_t n_flex_regs;
+
+	struct igt_list_head link; /* link for intel_perf.metric_sets */
+};
+
+/* A tree structure with group having subgroups and counters. */
+struct intel_perf_logical_counter_group {
+	/* Released with free() when the group is destroyed. */
+	char *name;
+
+	/* Counters attached to this group (intel_perf_logical_counter.link). */
+	struct igt_list_head counters;
+	/* Child groups, linked through their link member. */
+	struct igt_list_head groups;
+
+	struct igt_list_head link;  /* link for intel_perf_logical_counter_group.groups */
+};
+
+/* Top level object: the metric sets of one device plus the tree of
+ * counter groups. Created by intel_perf_for_fd() or
+ * intel_perf_for_devinfo(), destroyed by intel_perf_free().
+ */
+struct intel_perf {
+	const char *name;
+
+	/* Root of the counter group tree; created with an empty name. */
+	struct intel_perf_logical_counter_group *root_group;
+
+	/* List of intel_perf_metric_set, linked through their link member. */
+	struct igt_list_head metric_sets;
+
+	struct intel_perf_devinfo devinfo;
+};
+
+struct drm_i915_query_topology_info;
+
+/* Create an intel_perf object for the device behind drm_fd. Device id,
+ * revision and timestamp frequency are queried with GETPARAM, the GT
+ * frequency range is read from sysfs and the topology comes from the i915
+ * query ioctl. Returns NULL on failure.
+ */
+struct intel_perf *intel_perf_for_fd(int drm_fd);
+/* Same as above for an explicitly described device; topology is only read
+ * during the call. Returns NULL when no device info is known for
+ * device_id.
+ */
+struct intel_perf *intel_perf_for_devinfo(uint32_t device_id,
+					  uint32_t revision,
+					  uint64_t timestamp_frequency,
+					  uint64_t gt_min_freq,
+					  uint64_t gt_max_freq,
+					  const struct drm_i915_query_topology_info *topology);
+/* Release perf together with its counter groups and metric sets. */
+void intel_perf_free(struct intel_perf *perf);
+
+/* Link counter into the group tree of perf. group is a '/' separated path
+ * resolved from the root group; groups missing along the path are created.
+ */
+void intel_perf_add_logical_counter(struct intel_perf *perf,
+				    struct intel_perf_logical_counter *counter,
+				    const char *group);
+
+/* Append metric_set to the list of metric sets of perf. */
+void intel_perf_add_metric_set(struct intel_perf *perf,
+			       struct intel_perf_metric_set *metric_set);
+
+#ifdef __cplusplus
+};
+#endif
+
+#endif /* PERF_METRICS_H */
diff --git a/lib/meson.build b/lib/meson.build
index e87e5803..4de1b211 100644
--- a/lib/meson.build
+++ b/lib/meson.build
@@ -170,4 +170,69 @@ lib_igt_perf_build = static_library('igt_perf',
 lib_igt_perf = declare_dependency(link_with : lib_igt_perf_build,
 				  include_directories : inc)
 
+
+# Sources of the i915 perf library; the generated metrics code is appended
+# further down.
+i915_perf_files = [
+  'i915/perf.c',
+]
+
+# Platforms described by an i915/perf-configs/oa-<hw>.xml file.
+i915_perf_hardware = [
+  'hsw',
+  'bdw', 'chv',
+  'sklgt2', 'sklgt3', 'sklgt4',
+  'kblgt2', 'kblgt3',
+  'cflgt2', 'cflgt3',
+  'bxt', 'glk',
+  'cnl',
+  'icl', 'lkf',
+  'tgl',
+]
+
+i915_xml_files = []
+foreach hw : i915_perf_hardware
+  i915_xml_files += 'i915/perf-configs/oa-@0@.xml'.format(hw)
+endforeach
+
+# Generate the metrics code and header from all the XML descriptions.
+i915_perf_files += custom_target(
+  'i915-perf-metrics',
+  input : i915_xml_files,
+  output : [ 'i915_perf_metrics.c', 'i915_perf_metrics.h' ],
+  command : [
+    find_program('i915/perf-configs/perf-codegen.py'),
+    '--code', '@OUTPUT0@',
+    '--header', '@OUTPUT1@',
+    '@INPUT@',
+  ])
+
+lib_igt_i915_perf_build = shared_library(
+  'i915_perf',
+  i915_perf_files,
+  dependencies: [lib_igt, lib_igt_chipset],
+  include_directories : inc,
+  install: true)
+
+lib_igt_i915_perf = declare_dependency(
+  link_with : lib_igt_i915_perf_build,
+  include_directories : inc)
+
+install_headers(
+  'igt_list.h',
+  'intel_chipset.h',
+  'i915/perf.h',
+  subdir : 'i915-perf'
+)
+
+# Values substituted into i915-perf.pc.in.
+pkgconf = configuration_data()
+
+pkgconf.set('prefix', get_option('prefix'))
+pkgconf.set('exec_prefix', '${prefix}')
+pkgconf.set('libdir', '${prefix}/@0@'.format(get_option('libdir')))
+pkgconf.set('includedir', '${prefix}/@0@'.format(get_option('includedir')))
+pkgconf.set('version', '1.0.0')
+
+configure_file(
+  input : 'i915-perf.pc.in',
+  output : 'i915-perf.pc',
+  configuration : pkgconf,
+  install_dir : pkgconfigdir)
+
 subdir('tests')
diff --git a/tools/i915-perf/i915_perf_configs.c b/tools/i915-perf/i915_perf_configs.c
new file mode 100644
index 00000000..2a0283c9
--- /dev/null
+++ b/tools/i915-perf/i915_perf_configs.c
@@ -0,0 +1,277 @@
+/*
+ * Copyright (C) 2018 Intel Corporation
+ *
+ * Permission is hereby granted, free of charge, to any person obtaining a copy
+ * of this software and associated documentation files (the "Software"), to deal
+ * in the Software without restriction, including without limitation the rights
+ * to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
+ * copies of the Software, and to permit persons to whom the Software is
+ * furnished to do so, subject to the following conditions:
+ *
+ * The above copyright notice and this permission notice shall be included in
+ * all copies or substantial portions of the Software.
+ *
+ * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
+ * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
+ * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
+ * AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
+ * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
+ * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
+ * SOFTWARE.
+ */
+
+#include <assert.h>
+#include <dirent.h>
+#include <errno.h>
+#include <fcntl.h>
+#include <getopt.h>
+#include <inttypes.h>
+#include <stdbool.h>
+#include <stdint.h>
+#include <stdio.h>
+#include <stdlib.h>
+#include <string.h>
+#include <sys/ioctl.h>
+#include <sys/sysmacros.h>
+#include <sys/types.h>
+#include <sys/stat.h>
+#include <unistd.h>
+
+#include <i915_drm.h>
+
+#include "intel_chipset.h"
+#include "i915/perf.h"
+
+/* Read at most 31 bytes from @file and parse them with strtoull() (base
+ * auto-detected) into @value. Returns false when the file cannot be opened
+ * or read.
+ */
+static bool
+read_file_uint64(const char *file, uint64_t *value)
+{
+	char text[32];
+	int len;
+	int fd = open(file, 0);
+
+	if (fd < 0)
+		return false;
+
+	/* The descriptor is not needed past this single read. */
+	len = read(fd, text, sizeof (text) - 1);
+	close(fd);
+
+	if (len < 0)
+		return false;
+
+	text[len] = '\0';
+	*value = strtoull(text, 0, 0);
+
+	return true;
+}
+
+/* Read the numeric content of /sys/class/drm/<stem><id>/device/<param>.
+ *
+ * Returns the value converted to uint32_t, or 0 when the path cannot be
+ * built or the file cannot be read.
+ */
+static uint32_t
+read_device_param(const char *stem, int id, const char *param)
+{
+	char *name;
+	uint64_t value;
+	bool success;
+
+	/* Do not rely on assert() to catch an allocation failure: name
+	 * would be used uninitialized in NDEBUG builds.
+	 */
+	if (asprintf(&name, "/sys/class/drm/%s%d/device/%s", stem, id, param) < 0)
+		return 0;
+
+	success = read_file_uint64(name, &value);
+	free(name);
+
+	return success ? value : 0;
+}
+
+/* Probe renderD128 to renderD143 and return the number of the first node
+ * whose "vendor" device attribute reads 0x8086, or -1 if there is none.
+ */
+static int
+find_intel_render_node(void)
+{
+	enum { first_node = 128, n_nodes = 16 };
+	int node = first_node;
+
+	while (node < first_node + n_nodes) {
+		if (read_device_param("renderD", node, "vendor") == 0x8086)
+			return node;
+		node++;
+	}
+
+	return -1;
+}
+
+/* Open the first Intel render node found.
+ *
+ * On success @devid receives the value of the node's "device" attribute
+ * (0 if it cannot be read) and the file descriptor returned by open() is
+ * handed back. Returns -1 when no Intel render node exists or the device
+ * path cannot be built; @devid is left untouched in that case.
+ */
+static int
+open_render_node(uint32_t *devid)
+{
+	char *name;
+	int fd;
+
+	int render = find_intel_render_node();
+	if (render < 0)
+		return -1;
+
+	/* Do not rely on assert() to catch an allocation failure: name
+	 * would be used uninitialized in NDEBUG builds.
+	 */
+	if (asprintf(&name, "/dev/dri/renderD%d", render) < 0)
+		return -1;
+
+	*devid = read_device_param("renderD", render, "device");
+
+	fd = open(name, O_RDWR);
+	free(name);
+
+	return fd;
+}
+
+/* Find the number N of the "cardN" directory listed under
+ * /sys/dev/char/<major>:<minor>/device/drm for the device behind @fd.
+ *
+ * Returns N, or -1 when @fd cannot be stat'ed, the sysfs directory cannot
+ * be opened, or no "card*" directory is found.
+ */
+static int
+get_card_for_fd(int fd)
+{
+	struct stat sb;
+	int mjr, mnr;
+	char buffer[128];
+	DIR *drm_dir;
+	struct dirent *entry;
+	int retval = -1;
+
+	if (fstat(fd, &sb)) {
+		fprintf(stderr, "Failed to stat DRM fd\n");
+		return -1;
+	}
+
+	mjr = major(sb.st_rdev);
+	mnr = minor(sb.st_rdev);
+
+	snprintf(buffer, sizeof(buffer), "/sys/dev/char/%d:%d/device/drm", mjr, mnr);
+
+	/* Report the failure like the fstat() one above instead of
+	 * asserting: readdir(NULL) would follow in NDEBUG builds.
+	 */
+	drm_dir = opendir(buffer);
+	if (!drm_dir) {
+		fprintf(stderr, "Failed to open %s: %s\n", buffer, strerror(errno));
+		return -1;
+	}
+
+	while ((entry = readdir(drm_dir))) {
+		if (entry->d_type == DT_DIR && strncmp(entry->d_name, "card", 4) == 0) {
+			retval = strtoull(entry->d_name + 4, NULL, 10);
+			break;
+		}
+	}
+
+	closedir(drm_dir);
+
+	return retval;
+}
+
+/* ioctl() wrapper restarting the call for as long as it fails with EINTR
+ * or EAGAIN. Returns the value of the last ioctl() call.
+ */
+static int
+perf_ioctl(int fd, unsigned long request, void *arg)
+{
+	for (;;) {
+		int ret = ioctl(fd, request, arg);
+
+		if (ret != -1 || (errno != EINTR && errno != EAGAIN))
+			return ret;
+	}
+}
+
+/* Return the symbol name of the metric set of @perf whose hw_config_guid
+ * equals @hw_config_guid, or "Unknown" when no set matches.
+ */
+static const char *
+metric_name(struct intel_perf *perf, const char *hw_config_guid)
+{
+	struct intel_perf_metric_set *set;
+	const char *symbol = "Unknown";
+
+	igt_list_for_each_entry(set, &perf->metric_sets, link) {
+		if (strcmp(set->hw_config_guid, hw_config_guid) == 0) {
+			symbol = set->symbol_name;
+			break;
+		}
+	}
+
+	return symbol;
+}
+
+/* Print the command line help on stdout. */
+static void
+usage(void)
+{
+	static const char text[] =
+		"Usage: i915-perf-configs [options]\n"
+		"Manages i915-perf configurations stored in i915.\n"
+		"     --purge, -p         Purge configurations from the kernel\n"
+		"     --list,  -l         List configurations from the kernel\n";
+
+	fputs(text, stdout);
+}
+
+/* List (default, or --list) or remove (--purge) the perf configurations
+ * found in /sys/class/drm/card<N>/metrics for the first Intel render
+ * node. Each configuration is printed with its GUID, its id and the
+ * symbol name of the matching metric set.
+ *
+ * Exits with EXIT_FAILURE when no device can be opened, no device or perf
+ * information is available, or the metrics directory cannot be opened.
+ */
+int
+main(int argc, char *argv[])
+{
+	char metrics_path[128];
+	DIR *metrics_dir;
+	struct dirent *entry;
+	int drm_fd, drm_card;
+	int opt;
+	int ret = EXIT_FAILURE;
+	bool purge = false;
+	const struct option long_options[] = {
+		{"help",   no_argument, 0, 'h'},
+		{"list",   no_argument, 0, 'l'},
+		{"purge",  no_argument, 0, 'p'},
+		{0, 0, 0, 0}
+	};
+	const struct intel_device_info *devinfo;
+	struct intel_perf *perf = NULL;
+	uint32_t devid = 0;
+
+	while ((opt = getopt_long(argc, argv, "hlp", long_options, NULL)) != -1) {
+		switch (opt) {
+		case 'h':
+			usage();
+			return EXIT_SUCCESS;
+		case 'l':
+			/* Listing is the default mode. */
+			break;
+		case 'p':
+			purge = true;
+			break;
+		default:
+			fprintf(stderr, "Internal error: "
+				"unexpected getopt value: %d\n", opt);
+			usage();
+			return EXIT_FAILURE;
+		}
+	}
+
+	drm_fd = open_render_node(&devid);
+	if (drm_fd < 0) {
+		fprintf(stderr, "Unable to open an Intel render node.\n");
+		return EXIT_FAILURE;
+	}
+
+	drm_card = get_card_for_fd(drm_fd);
+	if (drm_card < 0) {
+		fprintf(stderr, "Unable to find the card of the render node.\n");
+		goto out;
+	}
+
+	fprintf(stdout, "Found device id=0x%x\n", devid);
+
+	/* The lookup is done by device id, not by file descriptor. */
+	devinfo = intel_get_device_info(devid);
+	if (!devinfo) {
+		fprintf(stderr, "No device info found.\n");
+		goto out;
+	}
+
+	fprintf(stdout, "Device gen=%i gt=%i\n", devinfo->gen, devinfo->gt);
+
+	perf = intel_perf_for_fd(drm_fd);
+	if (!perf) {
+		fprintf(stderr, "No perf data found.\n");
+		goto out;
+	}
+
+	snprintf(metrics_path, sizeof(metrics_path),
+		 "/sys/class/drm/card%d/metrics", drm_card);
+	metrics_dir = opendir(metrics_path);
+	if (!metrics_dir) {
+		fprintf(stderr, "Unable to open %s: %s\n",
+			metrics_path, strerror(errno));
+		goto out;
+	}
+
+	fprintf(stdout, "Looking at metrics in %s\n", metrics_path);
+
+	while ((entry = readdir(metrics_dir))) {
+		char metric_id_path[400];
+		uint64_t metric_id;
+		const char *name;
+
+		if (entry->d_type != DT_DIR)
+			continue;
+
+		snprintf(metric_id_path, sizeof(metric_id_path),
+			 "%s/%s/id", metrics_path, entry->d_name);
+
+		/* Directories without a readable id file are skipped. */
+		if (!read_file_uint64(metric_id_path, &metric_id))
+			continue;
+
+		/* The directory name is the GUID of the configuration. */
+		name = metric_name(perf, entry->d_name);
+
+		if (purge) {
+			if (perf_ioctl(drm_fd, DRM_IOCTL_I915_PERF_REMOVE_CONFIG, &metric_id) == 0)
+				fprintf(stdout, "\tRemoved config %s id=%03" PRIu64 " name=%s\n",
+					entry->d_name, metric_id, name);
+			else
+				fprintf(stdout, "\tFailed to remove config %s id=%03" PRIu64 " name=%s\n",
+					entry->d_name, metric_id, name);
+		} else {
+			fprintf(stdout, "\tConfig %s id=%03" PRIu64 " name=%s\n",
+				entry->d_name, metric_id, name);
+		}
+	}
+
+	closedir(metrics_dir);
+	ret = EXIT_SUCCESS;
+
+out:
+	if (perf)
+		intel_perf_free(perf);
+	close(drm_fd);
+
+	return ret;
+}
diff --git a/tools/i915-perf/meson.build b/tools/i915-perf/meson.build
new file mode 100644
index 00000000..0ebdd185
--- /dev/null
+++ b/tools/i915-perf/meson.build
@@ -0,0 +1,5 @@
+# Command line tool listing or purging the i915 perf configurations.
+executable(
+  'i915-perf-configs',
+  'i915_perf_configs.c',
+  dependencies : [lib_igt_chipset, lib_igt_i915_perf],
+  include_directories : inc,
+  install : true)
diff --git a/tools/meson.build b/tools/meson.build
index cf3f37b2..59b56d5d 100644
--- a/tools/meson.build
+++ b/tools/meson.build
@@ -100,4 +100,5 @@ executable('amd_hdmi_compliance', 'amd_hdmi_compliance.c',
 	   install_rpath : bindir_rpathdir,
 	   install : true)
 
+subdir('i915-perf')
 subdir('null_state_gen')
-- 
2.25.0



More information about the igt-dev mailing list